//
// Generated by NVIDIA NVVM Compiler
//
// Compiler Build ID: CL-31968024
// Cuda compilation tools, release 12.0, V12.0.76
// Based on NVVM 7.0.1
//

.version 8.0
.target sm_52
.address_size 64

	// .globl	__raygen__oxMain
// params: 384-byte, 16-byte-aligned parameter block in the .const state space.
// __raygen__oxMain only ever reads it, via ld.const at fixed byte offsets
// (in the visible part of the kernel: +64, +136..+208, +272..+320, +340,
// +352 and +372). Several of the 64-bit fields are converted with
// cvta.to.global and then used as base addresses for global loads/stores.
// NOTE(review): presumably this mirrors the host-side OptiX launch-parameter
// struct; the field layout is not declared in this file -- confirm against
// the host code before changing the size or any offset.
.const .align 16 .b8 params[384];
// __cudart_i2opi_f: 24 bytes = six little-endian 32-bit words
//   0x3C439041, 0xDB629599, 0xF534DDC0, 0xFC2757D1, 0x4E441529, 0xA2F9836E
// i.e. the leading hexadecimal digits of 2/pi (0x0.A2F9836E4E441529...),
// stored least-significant word first.
// The kernel's large-argument trig reduction loops read all six words with
// ld.global.nc.u32 and multiply each by the argument's left-aligned mantissa
// (mad.wide.u32 with carry propagation), writing the product words to the
// local scratch buffer __local_depot0. The byte values must not be altered.
.global .align 4 .b8 __cudart_i2opi_f[24] = {65, 144, 67, 60, 153, 149, 98, 219, 192, 221, 52, 245, 209, 87, 39, 252, 41, 21, 68, 78, 110, 131, 249, 162};

.visible .entry __raygen__oxMain()
{
	.local .align 4 .b8 	__local_depot0[28];
	.reg .b64 	%SP;
	.reg .b64 	%SPL;
	.reg .pred 	%p<177>;
	.reg .b16 	%rs<17>;
	.reg .f32 	%f<1477>;
	.reg .b32 	%r<766>;
	.reg .f64 	%fd<13>;
	.reg .b64 	%rd<179>;


	mov.u64 	%SPL, __local_depot0;
	add.u64 	%rd1, %SPL, 0;
	// begin inline asm
	call (%r155), _optix_get_launch_index_x, ();
	// end inline asm
	// begin inline asm
	call (%r156), _optix_get_launch_index_y, ();
	// end inline asm
	// begin inline asm
	call (%r158), _optix_get_launch_dimension_x, ();
	// end inline asm
	// begin inline asm
	call (%r159), _optix_get_launch_dimension_y, ();
	// end inline asm
	ld.const.v4.u32 	{%r161, %r162, %r163, %r164}, [params+352];
	add.s32 	%r169, %r161, %r155;
	and.b32  	%r170, %r169, 255;
	add.s32 	%r171, %r162, %r156;
	and.b32  	%r172, %r171, 255;
	add.s32 	%r173, %r163, %r155;
	and.b32  	%r174, %r173, 255;
	add.s32 	%r175, %r164, %r156;
	and.b32  	%r176, %r175, 255;
	ld.const.u64 	%rd47, [params+192];
	cvta.to.global.u64 	%rd48, %rd47;
	ld.const.u32 	%r177, [params+184];
	mad.lo.s32 	%r178, %r177, %r172, %r170;
	mul.wide.u32 	%rd49, %r178, 3;
	add.s64 	%rd50, %rd48, %rd49;
	ld.global.u8 	%rs3, [%rd50];
	cvt.rn.f32.u16 	%f367, %rs3;
	div.rn.f32 	%f1, %f367, 0f437F0000;
	ld.global.u8 	%rs4, [%rd50+1];
	cvt.rn.f32.u16 	%f368, %rs4;
	div.rn.f32 	%f2, %f368, 0f437F0000;
	ld.global.u8 	%rs5, [%rd50+2];
	cvt.rn.f32.u16 	%f369, %rs5;
	div.rn.f32 	%f3, %f369, 0f437F0000;
	mad.lo.s32 	%r179, %r177, %r176, %r174;
	mul.wide.u32 	%rd51, %r179, 3;
	add.s64 	%rd2, %rd48, %rd51;
	ld.const.u32 	%r5, [params+340];
	setp.eq.s32 	%p5, %r5, 0;
	@%p5 bra 	$L__BB0_26;

	ld.global.u8 	%rs6, [%rd2];
	cvt.rn.f32.u16 	%f370, %rs6;
	div.rn.f32 	%f371, %f370, 0f437F0000;
	ld.global.u8 	%rs7, [%rd2+1];
	cvt.rn.f32.u16 	%f372, %rs7;
	div.rn.f32 	%f373, %f372, 0f437F0000;
	ld.const.u64 	%rd52, [params+144];
	cvta.to.global.u64 	%rd53, %rd52;
	ld.const.u32 	%r180, [params+136];
	mad.lo.s32 	%r181, %r180, %r156, %r155;
	mul.wide.u32 	%rd54, %r181, 12;
	add.s64 	%rd55, %rd53, %rd54;
	ld.global.f32 	%f1386, [%rd55];
	ld.global.f32 	%f1387, [%rd55+4];
	ld.global.f32 	%f1388, [%rd55+8];
	ld.const.u64 	%rd56, [params+160];
	cvta.to.global.u64 	%rd57, %rd56;
	ld.const.u32 	%r182, [params+152];
	mad.lo.s32 	%r183, %r182, %r156, %r155;
	mul.wide.u32 	%rd58, %r183, 12;
	add.s64 	%rd59, %rd57, %rd58;
	ld.global.f32 	%f7, [%rd59];
	abs.f32 	%f374, %f7;
	ld.global.f32 	%f8, [%rd59+8];
	abs.f32 	%f375, %f8;
	setp.gt.f32 	%p6, %f374, %f375;
	ld.global.f32 	%f9, [%rd59+4];
	neg.f32 	%f376, %f9;
	neg.f32 	%f377, %f8;
	selp.f32 	%f378, 0f00000000, %f9, %p6;
	selp.f32 	%f379, %f7, %f377, %p6;
	selp.f32 	%f380, %f376, 0f00000000, %p6;
	mul.f32 	%f381, %f379, %f379;
	fma.rn.f32 	%f382, %f380, %f380, %f381;
	fma.rn.f32 	%f383, %f378, %f378, %f382;
	sqrt.rn.f32 	%f384, %f383;
	rcp.rn.f32 	%f385, %f384;
	mul.f32 	%f10, %f380, %f385;
	mul.f32 	%f11, %f379, %f385;
	mul.f32 	%f12, %f378, %f385;
	sqrt.rn.f32 	%f13, %f371;
	mul.f32 	%f14, %f373, 0f40C90FDB;
	mul.f32 	%f386, %f14, 0f3F22F983;
	cvt.rni.s32.f32 	%r749, %f386;
	cvt.rn.f32.s32 	%f387, %r749;
	mov.f32 	%f388, 0fBFC90FDA;
	fma.rn.f32 	%f389, %f387, %f388, %f14;
	mov.f32 	%f390, 0fB3A22168;
	fma.rn.f32 	%f391, %f387, %f390, %f389;
	mov.f32 	%f392, 0fA7C234C5;
	fma.rn.f32 	%f1380, %f387, %f392, %f391;
	abs.f32 	%f16, %f14;
	setp.ltu.f32 	%p7, %f16, 0f47CE4780;
	mov.u32 	%r745, %r749;
	mov.f32 	%f1377, %f1380;
	@%p7 bra 	$L__BB0_9;

	setp.eq.f32 	%p8, %f16, 0f7F800000;
	@%p8 bra 	$L__BB0_8;
	bra.uni 	$L__BB0_3;

$L__BB0_8:
	mov.f32 	%f395, 0f00000000;
	mul.rn.f32 	%f1377, %f14, %f395;
	mov.u32 	%r745, 0;
	bra.uni 	$L__BB0_9;

$L__BB0_26:
	ld.const.v4.f32 	{%f445, %f1386, %f1387, %f1388}, [params+304];
	cvt.rn.f32.u32 	%f450, %r159;
	cvt.rn.f32.u32 	%f451, %r158;
	div.rn.f32 	%f452, %f451, %f450;
	cvt.rn.f32.u32 	%f453, %r155;
	add.f32 	%f454, %f1, %f453;
	div.rn.f32 	%f455, %f454, %f451;
	cvt.rn.f32.u32 	%f456, %r156;
	add.f32 	%f457, %f2, %f456;
	div.rn.f32 	%f458, %f457, %f450;
	fma.rn.f32 	%f459, %f455, 0f40000000, 0fBF800000;
	fma.rn.f32 	%f460, %f458, 0f40000000, 0fBF800000;
	ld.const.f32 	%f461, [params+320];
	mul.f32 	%f462, %f452, %f461;
	ld.const.v4.f32 	{%f463, %f464, %f465, %f466}, [params+272];
	mul.f32 	%f471, %f459, %f463;
	mul.f32 	%f472, %f459, %f464;
	mul.f32 	%f473, %f459, %f465;
	ld.const.v4.f32 	{%f474, %f475, %f476, %f477}, [params+288];
	fma.rn.f32 	%f482, %f462, %f471, %f476;
	fma.rn.f32 	%f483, %f462, %f472, %f477;
	fma.rn.f32 	%f484, %f462, %f473, %f445;
	mul.f32 	%f485, %f460, %f466;
	mul.f32 	%f486, %f460, %f474;
	mul.f32 	%f487, %f460, %f475;
	fma.rn.f32 	%f488, %f461, %f485, %f482;
	fma.rn.f32 	%f489, %f461, %f486, %f483;
	fma.rn.f32 	%f490, %f461, %f487, %f484;
	mul.f32 	%f491, %f489, %f489;
	fma.rn.f32 	%f492, %f488, %f488, %f491;
	fma.rn.f32 	%f493, %f490, %f490, %f492;
	sqrt.rn.f32 	%f494, %f493;
	rcp.rn.f32 	%f495, %f494;
	mul.f32 	%f1383, %f488, %f495;
	mul.f32 	%f1384, %f489, %f495;
	mul.f32 	%f1385, %f495, %f490;
	bra.uni 	$L__BB0_27;

$L__BB0_3:
	mov.b32 	%r7, %f14;
	bfe.u32 	%r185, %r7, 23, 8;
	add.s32 	%r8, %r185, -128;
	shl.b32 	%r186, %r7, 8;
	or.b32  	%r9, %r186, -2147483648;
	shr.u32 	%r10, %r8, 5;
	mov.u64 	%rd163, 0;
	mov.u32 	%r742, 0;
	mov.u64 	%rd162, __cudart_i2opi_f;
	mov.u64 	%rd161, %rd1;

$L__BB0_4:
	.pragma "nounroll";
	ld.global.nc.u32 	%r187, [%rd162];
	mad.wide.u32 	%rd62, %r187, %r9, %rd163;
	shr.u64 	%rd163, %rd62, 32;
	st.local.u32 	[%rd161], %rd62;
	add.s64 	%rd162, %rd162, 4;
	add.s64 	%rd161, %rd161, 4;
	add.s32 	%r742, %r742, 1;
	setp.ne.s32 	%p9, %r742, 6;
	@%p9 bra 	$L__BB0_4;

	st.local.u32 	[%rd1+24], %rd163;
	mov.u32 	%r188, 4;
	sub.s32 	%r13, %r188, %r10;
	mov.u32 	%r189, 6;
	sub.s32 	%r190, %r189, %r10;
	mul.wide.s32 	%rd63, %r190, 4;
	add.s64 	%rd64, %rd1, %rd63;
	ld.local.u32 	%r743, [%rd64];
	ld.local.u32 	%r744, [%rd64+-4];
	and.b32  	%r16, %r8, 31;
	setp.eq.s32 	%p10, %r16, 0;
	@%p10 bra 	$L__BB0_7;

	mov.u32 	%r191, 32;
	sub.s32 	%r192, %r191, %r16;
	shr.u32 	%r193, %r744, %r192;
	shl.b32 	%r194, %r743, %r16;
	add.s32 	%r743, %r193, %r194;
	mul.wide.s32 	%rd65, %r13, 4;
	add.s64 	%rd66, %rd1, %rd65;
	ld.local.u32 	%r195, [%rd66];
	shr.u32 	%r196, %r195, %r192;
	shl.b32 	%r197, %r744, %r16;
	add.s32 	%r744, %r196, %r197;

$L__BB0_7:
	and.b32  	%r198, %r7, -2147483648;
	shr.u32 	%r199, %r744, 30;
	shl.b32 	%r200, %r743, 2;
	or.b32  	%r201, %r199, %r200;
	shr.u32 	%r202, %r201, 31;
	shr.u32 	%r203, %r743, 30;
	add.s32 	%r204, %r202, %r203;
	neg.s32 	%r205, %r204;
	setp.eq.s32 	%p11, %r198, 0;
	selp.b32 	%r745, %r204, %r205, %p11;
	setp.ne.s32 	%p12, %r202, 0;
	xor.b32  	%r206, %r198, -2147483648;
	selp.b32 	%r207, %r206, %r198, %p12;
	selp.b32 	%r208, -1, 0, %p12;
	xor.b32  	%r209, %r201, %r208;
	shl.b32 	%r210, %r744, 2;
	xor.b32  	%r211, %r210, %r208;
	cvt.u64.u32 	%rd67, %r209;
	cvt.u64.u32 	%rd68, %r211;
	bfi.b64 	%rd69, %rd67, %rd68, 32, 32;
	cvt.rn.f64.s64 	%fd1, %rd69;
	mul.f64 	%fd2, %fd1, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f393, %fd2;
	setp.eq.s32 	%p13, %r207, 0;
	neg.f32 	%f394, %f393;
	selp.f32 	%f1377, %f393, %f394, %p13;

$L__BB0_9:
	add.s32 	%r23, %r745, 1;
	and.b32  	%r24, %r23, 1;
	setp.eq.s32 	%p14, %r24, 0;
	selp.f32 	%f20, %f1377, 0f3F800000, %p14;
	mul.rn.f32 	%f21, %f1377, %f1377;
	mov.f32 	%f1378, 0fB94D4153;
	@%p14 bra 	$L__BB0_11;

	mov.f32 	%f397, 0fBAB607ED;
	mov.f32 	%f398, 0f37CBAC00;
	fma.rn.f32 	%f1378, %f398, %f21, %f397;

$L__BB0_11:
	selp.f32 	%f399, 0f3C0885E4, 0f3D2AAABB, %p14;
	fma.rn.f32 	%f400, %f1378, %f21, %f399;
	selp.f32 	%f401, 0fBE2AAAA8, 0fBEFFFFFF, %p14;
	fma.rn.f32 	%f402, %f400, %f21, %f401;
	mov.f32 	%f403, 0f00000000;
	fma.rn.f32 	%f404, %f21, %f20, %f403;
	fma.rn.f32 	%f1379, %f402, %f404, %f20;
	and.b32  	%r213, %r23, 2;
	setp.eq.s32 	%p16, %r213, 0;
	@%p16 bra 	$L__BB0_13;

	mov.f32 	%f406, 0fBF800000;
	fma.rn.f32 	%f1379, %f1379, %f406, %f403;

$L__BB0_13:
	@%p7 bra 	$L__BB0_21;

	setp.eq.f32 	%p18, %f16, 0f7F800000;
	@%p18 bra 	$L__BB0_20;
	bra.uni 	$L__BB0_15;

$L__BB0_20:
	mov.f32 	%f409, 0f00000000;
	mul.rn.f32 	%f1380, %f14, %f409;
	mov.u32 	%r749, 0;
	bra.uni 	$L__BB0_21;

$L__BB0_15:
	mov.b32 	%r25, %f14;
	bfe.u32 	%r215, %r25, 23, 8;
	add.s32 	%r26, %r215, -128;
	shl.b32 	%r216, %r25, 8;
	or.b32  	%r27, %r216, -2147483648;
	shr.u32 	%r28, %r26, 5;
	mov.u64 	%rd166, 0;
	mov.u32 	%r746, 0;
	mov.u64 	%rd165, __cudart_i2opi_f;
	mov.u64 	%rd164, %rd1;

$L__BB0_16:
	.pragma "nounroll";
	ld.global.nc.u32 	%r217, [%rd165];
	mad.wide.u32 	%rd72, %r217, %r27, %rd166;
	shr.u64 	%rd166, %rd72, 32;
	st.local.u32 	[%rd164], %rd72;
	add.s64 	%rd165, %rd165, 4;
	add.s64 	%rd164, %rd164, 4;
	add.s32 	%r746, %r746, 1;
	setp.ne.s32 	%p19, %r746, 6;
	@%p19 bra 	$L__BB0_16;

	st.local.u32 	[%rd1+24], %rd166;
	mov.u32 	%r218, 4;
	sub.s32 	%r31, %r218, %r28;
	mov.u32 	%r219, 6;
	sub.s32 	%r220, %r219, %r28;
	mul.wide.s32 	%rd73, %r220, 4;
	add.s64 	%rd74, %rd1, %rd73;
	ld.local.u32 	%r747, [%rd74];
	ld.local.u32 	%r748, [%rd74+-4];
	and.b32  	%r34, %r26, 31;
	setp.eq.s32 	%p20, %r34, 0;
	@%p20 bra 	$L__BB0_19;

	mov.u32 	%r221, 32;
	sub.s32 	%r222, %r221, %r34;
	shr.u32 	%r223, %r748, %r222;
	shl.b32 	%r224, %r747, %r34;
	add.s32 	%r747, %r223, %r224;
	mul.wide.s32 	%rd75, %r31, 4;
	add.s64 	%rd76, %rd1, %rd75;
	ld.local.u32 	%r225, [%rd76];
	shr.u32 	%r226, %r225, %r222;
	shl.b32 	%r227, %r748, %r34;
	add.s32 	%r748, %r226, %r227;

$L__BB0_19:
	and.b32  	%r228, %r25, -2147483648;
	shr.u32 	%r229, %r748, 30;
	shl.b32 	%r230, %r747, 2;
	or.b32  	%r231, %r229, %r230;
	shr.u32 	%r232, %r231, 31;
	shr.u32 	%r233, %r747, 30;
	add.s32 	%r234, %r232, %r233;
	neg.s32 	%r235, %r234;
	setp.eq.s32 	%p21, %r228, 0;
	selp.b32 	%r749, %r234, %r235, %p21;
	setp.ne.s32 	%p22, %r232, 0;
	xor.b32  	%r236, %r228, -2147483648;
	selp.b32 	%r237, %r236, %r228, %p22;
	selp.b32 	%r238, -1, 0, %p22;
	xor.b32  	%r239, %r231, %r238;
	shl.b32 	%r240, %r748, 2;
	xor.b32  	%r241, %r240, %r238;
	cvt.u64.u32 	%rd77, %r239;
	cvt.u64.u32 	%rd78, %r241;
	bfi.b64 	%rd79, %rd77, %rd78, 32, 32;
	cvt.rn.f64.s64 	%fd3, %rd79;
	mul.f64 	%fd4, %fd3, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f407, %fd4;
	setp.eq.s32 	%p23, %r237, 0;
	neg.f32 	%f408, %f407;
	selp.f32 	%f1380, %f407, %f408, %p23;

$L__BB0_21:
	mul.f32 	%f30, %f13, %f1379;
	and.b32  	%r41, %r749, 1;
	setp.eq.s32 	%p24, %r41, 0;
	selp.f32 	%f31, %f1380, 0f3F800000, %p24;
	mul.rn.f32 	%f32, %f1380, %f1380;
	mov.f32 	%f1381, 0fB94D4153;
	@%p24 bra 	$L__BB0_23;

	mov.f32 	%f411, 0fBAB607ED;
	mov.f32 	%f412, 0f37CBAC00;
	fma.rn.f32 	%f1381, %f412, %f32, %f411;

$L__BB0_23:
	selp.f32 	%f413, 0f3C0885E4, 0f3D2AAABB, %p24;
	fma.rn.f32 	%f414, %f1381, %f32, %f413;
	selp.f32 	%f415, 0fBE2AAAA8, 0fBEFFFFFF, %p24;
	fma.rn.f32 	%f416, %f414, %f32, %f415;
	mov.f32 	%f417, 0f00000000;
	fma.rn.f32 	%f418, %f32, %f31, %f417;
	fma.rn.f32 	%f1382, %f416, %f418, %f31;
	and.b32  	%r243, %r749, 2;
	setp.eq.s32 	%p26, %r243, 0;
	@%p26 bra 	$L__BB0_25;

	mov.f32 	%f420, 0fBF800000;
	fma.rn.f32 	%f1382, %f1382, %f420, %f417;

$L__BB0_25:
	mul.f32 	%f421, %f30, %f30;
	mov.f32 	%f422, 0f3F800000;
	sub.f32 	%f423, %f422, %f421;
	mul.f32 	%f424, %f13, %f1382;
	mul.f32 	%f425, %f424, %f424;
	sub.f32 	%f426, %f423, %f425;
	max.f32 	%f428, %f417, %f426;
	sqrt.rn.f32 	%f429, %f428;
	mul.f32 	%f430, %f10, %f424;
	mul.f32 	%f431, %f11, %f424;
	mul.f32 	%f432, %f12, %f424;
	mul.f32 	%f433, %f8, %f11;
	mul.f32 	%f434, %f9, %f12;
	sub.f32 	%f435, %f433, %f434;
	fma.rn.f32 	%f436, %f435, %f30, %f430;
	mul.f32 	%f437, %f7, %f12;
	mul.f32 	%f438, %f8, %f10;
	sub.f32 	%f439, %f437, %f438;
	fma.rn.f32 	%f440, %f439, %f30, %f431;
	mul.f32 	%f441, %f9, %f10;
	mul.f32 	%f442, %f7, %f11;
	sub.f32 	%f443, %f441, %f442;
	fma.rn.f32 	%f444, %f443, %f30, %f432;
	fma.rn.f32 	%f1383, %f7, %f429, %f436;
	fma.rn.f32 	%f1384, %f9, %f429, %f440;
	fma.rn.f32 	%f1385, %f8, %f429, %f444;

$L__BB0_27:
	ld.const.u64 	%rd80, [params+176];
	cvta.to.global.u64 	%rd81, %rd80;
	ld.const.u32 	%r244, [params+168];
	mad.lo.s32 	%r245, %r244, %r156, %r155;
	mul.wide.u32 	%rd82, %r245, 12;
	add.s64 	%rd15, %rd81, %rd82;
	ld.global.f32 	%f53, [%rd15+4];
	ld.global.f32 	%f54, [%rd15];
	add.f32 	%f503, %f54, %f53;
	ld.global.f32 	%f55, [%rd15+8];
	add.f32 	%f504, %f503, %f55;
	setp.eq.f32 	%p27, %f504, 0f00000000;
	mov.f32 	%f1389, 0f00000000;
	setp.ne.s32 	%p28, %r5, 0;
	mov.f32 	%f1392, 0fBF800000;
	and.pred  	%p29, %p28, %p27;
	mov.f32 	%f1390, %f1389;
	mov.f32 	%f1391, %f1389;
	mov.f32 	%f1393, %f1389;
	mov.f32 	%f1394, %f1389;
	mov.f32 	%f1395, %f1389;
	@%p29 bra 	$L__BB0_29;

	ld.const.u64 	%rd83, [params+64];
	mov.f32 	%f512, 0f6C4ECB8F;
	mov.f32 	%f513, 0f00000000;
	mov.u32 	%r279, 1;
	mov.u32 	%r282, 2;
	mov.u32 	%r284, 7;
	mov.u32 	%r288, 2139095039;
	mov.u32 	%r291, 1065353216;
	mov.u32 	%r316, 0;
	// begin inline asm
	call(%r246,%r247,%r248,%r249,%r250,%r251,%r252,%r253,%r254,%r255,%r256,%r257,%r258,%r259,%r260,%r261,%r262,%r263,%r264,%r265,%r266,%r267,%r268,%r269,%r270,%r271,%r272,%r273,%r274,%r275,%r276,%r277),_optix_trace_typed_32,(%r316,%rd83,%f1386,%f1387,%f1388,%f1383,%f1384,%f1385,%f513,%f512,%f513,%r279,%r316,%r316,%r282,%r316,%r284,%r316,%r316,%r316,%r288,%r291,%r291,%r291,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316);
	// end inline asm
	mov.b32 	%f1389, %r246;
	mov.b32 	%f1390, %r247;
	mov.b32 	%f1391, %r248;
	mov.b32 	%f1392, %r249;
	mov.b32 	%f1393, %r250;
	mov.b32 	%f1394, %r251;
	mov.b32 	%f1395, %r252;

$L__BB0_29:
	setp.ltu.f32 	%p30, %f1392, 0f00000000;
	@%p30 bra 	$L__BB0_125;
	bra.uni 	$L__BB0_30;

$L__BB0_125:
	selp.u16 	%rs16, 1, 0, %p5;
	mov.f32 	%f1453, 0f00000000;
	mov.f32 	%f1454, %f1453;
	mov.f32 	%f1455, %f1453;
	mov.f32 	%f1456, %f1453;
	mov.f32 	%f1457, %f1453;
	mov.f32 	%f1458, %f1453;
	mov.f32 	%f1459, %f1453;
	mov.f32 	%f1460, %f1453;
	mov.f32 	%f1461, %f1453;
	bra.uni 	$L__BB0_126;

$L__BB0_30:
	fma.rn.f32 	%f514, %f1383, %f1392, %f1386;
	fma.rn.f32 	%f515, %f1384, %f1392, %f1387;
	fma.rn.f32 	%f516, %f1385, %f1392, %f1388;
	mul.f32 	%f517, %f514, 0f3456BF95;
	mul.f32 	%f518, %f515, 0f3456BF95;
	mul.f32 	%f519, %f516, 0f3456BF95;
	abs.f32 	%f520, %f517;
	abs.f32 	%f521, %f518;
	abs.f32 	%f522, %f519;
	max.f32 	%f523, %f520, %f521;
	max.f32 	%f524, %f523, %f522;
	mov.f32 	%f525, 0f38D1B717;
	max.f32 	%f526, %f524, %f525;
	fma.rn.f32 	%f70, %f1389, %f526, %f514;
	fma.rn.f32 	%f71, %f1390, %f526, %f515;
	fma.rn.f32 	%f72, %f1391, %f526, %f516;
	ld.const.u64 	%rd84, [params+144];
	cvta.to.global.u64 	%rd85, %rd84;
	ld.const.u32 	%r317, [params+136];
	mad.lo.s32 	%r318, %r317, %r156, %r155;
	mul.wide.u32 	%rd86, %r318, 12;
	add.s64 	%rd87, %rd85, %rd86;
	st.global.f32 	[%rd87], %f70;
	st.global.f32 	[%rd87+4], %f71;
	st.global.f32 	[%rd87+8], %f72;
	ld.const.u64 	%rd88, [params+160];
	cvta.to.global.u64 	%rd89, %rd88;
	ld.const.u32 	%r319, [params+152];
	mad.lo.s32 	%r320, %r319, %r156, %r155;
	mul.wide.u32 	%rd90, %r320, 12;
	add.s64 	%rd91, %rd89, %rd90;
	st.global.f32 	[%rd91], %f1389;
	st.global.f32 	[%rd91+4], %f1390;
	st.global.f32 	[%rd91+8], %f1391;
	neg.f32 	%f527, %f1393;
	setp.lt.f32 	%p31, %f1393, 0f00000000;
	selp.f32 	%f528, %f527, %f1393, %p31;
	ld.const.f32 	%f529, [params+372];
	selp.f32 	%f530, %f529, 0f3F800000, %p31;
	cvt.rmi.f32.f32 	%f531, %f528;
	sub.f32 	%f532, %f528, %f531;
	cvt.rmi.f32.f32 	%f533, %f1394;
	sub.f32 	%f534, %f1394, %f533;
	cvt.rmi.f32.f32 	%f535, %f1395;
	sub.f32 	%f536, %f1395, %f535;
	mul.f32 	%f1456, %f530, %f532;
	mul.f32 	%f1457, %f530, %f534;
	mul.f32 	%f1458, %f530, %f536;
	mul.f32 	%f1453, %f531, 0f3B808081;
	mul.f32 	%f1454, %f533, 0f3B808081;
	mul.f32 	%f1455, %f535, 0f3B808081;
	setp.lt.s32 	%p32, %r5, 1;
	@%p32 bra 	$L__BB0_32;

	mul.f32 	%f1456, %f54, %f1456;
	mul.f32 	%f1457, %f53, %f1457;
	mul.f32 	%f1458, %f55, %f1458;
	mul.f32 	%f1453, %f54, %f1453;
	mul.f32 	%f1454, %f53, %f1454;
	mul.f32 	%f1455, %f55, %f1455;

$L__BB0_32:
	ld.const.u32 	%r42, [params+200];
	setp.eq.s32 	%p33, %r42, 0;
	mov.f32 	%f1461, 0f00000000;
	mov.f32 	%f1460, %f1461;
	mov.f32 	%f1459, %f1461;
	@%p33 bra 	$L__BB0_96;

	cvt.rn.f32.u32 	%f91, %r42;
	mul.f32 	%f540, %f3, %f91;
	cvt.rzi.u32.f32 	%r321, %f540;
	add.s32 	%r322, %r42, -1;
	min.u32 	%r323, %r321, %r322;
	ld.const.u64 	%rd92, [params+208];
	cvta.to.global.u64 	%rd93, %rd92;
	mul.wide.u32 	%rd94, %r323, 64;
	add.s64 	%rd16, %rd93, %rd94;
	ld.global.v4.f32 	{%f541, %f542, %f543, %f544}, [%rd16];
	ld.global.v4.f32 	{%f545, %f546, %f547, %f548}, [%rd16+16];
	ld.global.u64 	%rd17, [%rd16+48];
	setp.lt.f32 	%p34, %f541, 0f3F800000;
	@%p34 bra 	$L__BB0_65;
	bra.uni 	$L__BB0_34;

$L__BB0_65:
	fma.rn.f32 	%f658, %f542, 0f40000000, 0fBF800000;
	fma.rn.f32 	%f659, %f543, 0f40000000, 0fBF800000;
	abs.f32 	%f660, %f658;
	mov.f32 	%f1417, 0f3F800000;
	sub.f32 	%f661, %f1417, %f660;
	abs.f32 	%f662, %f659;
	sub.f32 	%f663, %f661, %f662;
	neg.f32 	%f664, %f663;
	cvt.sat.f32.f32 	%f665, %f664;
	setp.ge.f32 	%p61, %f658, 0f00000000;
	neg.f32 	%f666, %f665;
	selp.f32 	%f667, %f666, %f665, %p61;
	add.f32 	%f668, %f658, %f667;
	setp.ge.f32 	%p62, %f659, 0f00000000;
	selp.f32 	%f669, %f666, %f665, %p62;
	add.f32 	%f670, %f659, %f669;
	mul.f32 	%f671, %f670, %f670;
	fma.rn.f32 	%f672, %f668, %f668, %f671;
	fma.rn.f32 	%f673, %f663, %f663, %f672;
	sqrt.rn.f32 	%f674, %f673;
	rcp.rn.f32 	%f675, %f674;
	mul.f32 	%f154, %f668, %f675;
	mul.f32 	%f155, %f670, %f675;
	mul.f32 	%f156, %f663, %f675;
	neg.f32 	%f157, %f155;
	neg.f32 	%f158, %f156;
	mul.f32 	%f676, %f1389, %f154;
	mul.f32 	%f677, %f1390, %f157;
	sub.f32 	%f678, %f677, %f676;
	mul.f32 	%f679, %f1391, %f156;
	sub.f32 	%f159, %f678, %f679;
	setp.leu.f32 	%p63, %f159, 0f00000000;
	setp.eq.s64 	%p64, %rd17, 0;
	or.pred  	%p65, %p64, %p63;
	mov.f32 	%f1418, %f1417;
	mov.f32 	%f1419, %f1417;
	mov.f32 	%f1420, %f159;
	@%p65 bra 	$L__BB0_67;

	ld.global.v4.f32 	{%f680, %f681, %f682, %f683}, [%rd16+32];
	abs.f32 	%f684, %f154;
	abs.f32 	%f685, %f156;
	setp.gt.f32 	%p66, %f684, %f685;
	selp.f32 	%f686, %f157, 0f00000000, %p66;
	selp.f32 	%f687, %f154, %f158, %p66;
	selp.f32 	%f688, 0f00000000, %f155, %p66;
	mul.f32 	%f689, %f687, %f687;
	fma.rn.f32 	%f690, %f686, %f686, %f689;
	fma.rn.f32 	%f691, %f688, %f688, %f690;
	sqrt.rn.f32 	%f692, %f691;
	rcp.rn.f32 	%f693, %f692;
	mul.f32 	%f694, %f686, %f693;
	mul.f32 	%f695, %f687, %f693;
	mul.f32 	%f696, %f688, %f693;
	mul.f32 	%f697, %f156, %f695;
	mul.f32 	%f698, %f155, %f696;
	sub.f32 	%f699, %f697, %f698;
	mul.f32 	%f700, %f154, %f696;
	mul.f32 	%f701, %f156, %f694;
	sub.f32 	%f702, %f700, %f701;
	mul.f32 	%f703, %f155, %f694;
	mul.f32 	%f704, %f154, %f695;
	sub.f32 	%f705, %f703, %f704;
	mul.f32 	%f706, %f71, %f702;
	fma.rn.f32 	%f707, %f70, %f699, %f706;
	fma.rn.f32 	%f708, %f72, %f705, %f707;
	fma.rn.f32 	%f711, %f680, %f708, %f682;
	mul.f32 	%f712, %f71, %f695;
	fma.rn.f32 	%f713, %f70, %f694, %f712;
	fma.rn.f32 	%f714, %f72, %f696, %f713;
	fma.rn.f32 	%f717, %f681, %f714, %f683;
	tex.2d.v4.f32.f32 	{%f1417, %f1418, %f1419, %f718}, [%rd17, {%f711, %f717}];
	max.f32 	%f719, %f1417, %f1418;
	max.f32 	%f720, %f719, %f1419;
	mul.f32 	%f1420, %f159, %f720;

$L__BB0_67:
	setp.le.f32 	%p67, %f1420, 0f00000000;
	mov.f32 	%f1430, 0f00000000;
	mov.f32 	%f1431, %f1430;
	mov.f32 	%f1432, %f1430;
	@%p67 bra 	$L__BB0_95;

	abs.f32 	%f727, %f154;
	abs.f32 	%f728, %f156;
	setp.gt.f32 	%p68, %f727, %f728;
	selp.f32 	%f729, %f157, 0f00000000, %p68;
	selp.f32 	%f730, %f154, %f158, %p68;
	selp.f32 	%f731, 0f00000000, %f155, %p68;
	mul.f32 	%f732, %f730, %f730;
	fma.rn.f32 	%f733, %f729, %f729, %f732;
	fma.rn.f32 	%f734, %f731, %f731, %f733;
	sqrt.rn.f32 	%f735, %f734;
	rcp.rn.f32 	%f736, %f735;
	mov.f32 	%f1427, 0f3F800000;
	mul.f32 	%f168, %f729, %f736;
	mul.f32 	%f169, %f730, %f736;
	mul.f32 	%f170, %f731, %f736;
	setp.ltu.f32 	%p69, %f545, 0f00000000;
	mov.f32 	%f1428, %f1427;
	mov.f32 	%f1429, %f1427;
	@%p69 bra 	$L__BB0_94;

	sqrt.rn.f32 	%f171, %f1;
	mul.f32 	%f172, %f2, 0f40C90FDB;
	mul.f32 	%f737, %f172, 0f3F22F983;
	cvt.rni.s32.f32 	%r765, %f737;
	cvt.rn.f32.s32 	%f738, %r765;
	mov.f32 	%f739, 0fBFC90FDA;
	fma.rn.f32 	%f740, %f738, %f739, %f172;
	mov.f32 	%f741, 0fB3A22168;
	fma.rn.f32 	%f742, %f738, %f741, %f740;
	mov.f32 	%f743, 0fA7C234C5;
	fma.rn.f32 	%f1424, %f738, %f743, %f742;
	abs.f32 	%f174, %f172;
	setp.ltu.f32 	%p70, %f174, 0f47CE4780;
	mov.u32 	%r761, %r765;
	mov.f32 	%f1421, %f1424;
	@%p70 bra 	$L__BB0_77;

	setp.eq.f32 	%p71, %f174, 0f7F800000;
	@%p71 bra 	$L__BB0_76;
	bra.uni 	$L__BB0_71;

$L__BB0_76:
	mov.f32 	%f746, 0f00000000;
	mul.rn.f32 	%f1421, %f172, %f746;
	mov.u32 	%r761, 0;
	bra.uni 	$L__BB0_77;

$L__BB0_34:
	abs.f32 	%f549, %f1389;
	abs.f32 	%f550, %f1391;
	setp.gt.f32 	%p35, %f549, %f550;
	neg.f32 	%f551, %f1390;
	selp.f32 	%f552, %f551, 0f00000000, %p35;
	neg.f32 	%f553, %f1391;
	selp.f32 	%f554, %f1389, %f553, %p35;
	selp.f32 	%f555, 0f00000000, %f1390, %p35;
	mul.f32 	%f556, %f554, %f554;
	fma.rn.f32 	%f557, %f552, %f552, %f556;
	fma.rn.f32 	%f558, %f555, %f555, %f557;
	sqrt.rn.f32 	%f559, %f558;
	rcp.rn.f32 	%f560, %f559;
	mul.f32 	%f102, %f552, %f560;
	mul.f32 	%f103, %f554, %f560;
	mul.f32 	%f104, %f555, %f560;
	sqrt.rn.f32 	%f105, %f1;
	mul.f32 	%f106, %f2, 0f40C90FDB;
	mul.f32 	%f561, %f106, 0f3F22F983;
	cvt.rni.s32.f32 	%r757, %f561;
	cvt.rn.f32.s32 	%f562, %r757;
	mov.f32 	%f563, 0fBFC90FDA;
	fma.rn.f32 	%f564, %f562, %f563, %f106;
	mov.f32 	%f565, 0fB3A22168;
	fma.rn.f32 	%f566, %f562, %f565, %f564;
	mov.f32 	%f567, 0fA7C234C5;
	fma.rn.f32 	%f1405, %f562, %f567, %f566;
	abs.f32 	%f108, %f106;
	setp.ltu.f32 	%p36, %f108, 0f47CE4780;
	mov.u32 	%r753, %r757;
	mov.f32 	%f1402, %f1405;
	@%p36 bra 	$L__BB0_42;

	setp.eq.f32 	%p37, %f108, 0f7F800000;
	@%p37 bra 	$L__BB0_41;
	bra.uni 	$L__BB0_36;

$L__BB0_41:
	mov.f32 	%f570, 0f00000000;
	mul.rn.f32 	%f1402, %f106, %f570;
	mov.u32 	%r753, 0;
	bra.uni 	$L__BB0_42;

$L__BB0_36:
	mov.b32 	%r44, %f106;
	bfe.u32 	%r325, %r44, 23, 8;
	add.s32 	%r45, %r325, -128;
	shl.b32 	%r326, %r44, 8;
	or.b32  	%r46, %r326, -2147483648;
	shr.u32 	%r47, %r45, 5;
	mov.u64 	%rd169, 0;
	mov.u32 	%r750, 0;
	mov.u64 	%rd168, __cudart_i2opi_f;
	mov.u64 	%rd167, %rd1;

$L__BB0_37:
	.pragma "nounroll";
	ld.global.nc.u32 	%r327, [%rd168];
	mad.wide.u32 	%rd97, %r327, %r46, %rd169;
	shr.u64 	%rd169, %rd97, 32;
	st.local.u32 	[%rd167], %rd97;
	add.s64 	%rd168, %rd168, 4;
	add.s64 	%rd167, %rd167, 4;
	add.s32 	%r750, %r750, 1;
	setp.ne.s32 	%p38, %r750, 6;
	@%p38 bra 	$L__BB0_37;

	st.local.u32 	[%rd1+24], %rd169;
	mov.u32 	%r328, 4;
	sub.s32 	%r50, %r328, %r47;
	mov.u32 	%r329, 6;
	sub.s32 	%r330, %r329, %r47;
	mul.wide.s32 	%rd98, %r330, 4;
	add.s64 	%rd99, %rd1, %rd98;
	ld.local.u32 	%r751, [%rd99];
	ld.local.u32 	%r752, [%rd99+-4];
	and.b32  	%r53, %r45, 31;
	setp.eq.s32 	%p39, %r53, 0;
	@%p39 bra 	$L__BB0_40;

	mov.u32 	%r331, 32;
	sub.s32 	%r332, %r331, %r53;
	shr.u32 	%r333, %r752, %r332;
	shl.b32 	%r334, %r751, %r53;
	add.s32 	%r751, %r333, %r334;
	mul.wide.s32 	%rd100, %r50, 4;
	add.s64 	%rd101, %rd1, %rd100;
	ld.local.u32 	%r335, [%rd101];
	shr.u32 	%r336, %r335, %r332;
	shl.b32 	%r337, %r752, %r53;
	add.s32 	%r752, %r336, %r337;

$L__BB0_40:
	and.b32  	%r338, %r44, -2147483648;
	shr.u32 	%r339, %r752, 30;
	shl.b32 	%r340, %r751, 2;
	or.b32  	%r341, %r339, %r340;
	shr.u32 	%r342, %r341, 31;
	shr.u32 	%r343, %r751, 30;
	add.s32 	%r344, %r342, %r343;
	neg.s32 	%r345, %r344;
	setp.eq.s32 	%p40, %r338, 0;
	selp.b32 	%r753, %r344, %r345, %p40;
	setp.ne.s32 	%p41, %r342, 0;
	xor.b32  	%r346, %r338, -2147483648;
	selp.b32 	%r347, %r346, %r338, %p41;
	selp.b32 	%r348, -1, 0, %p41;
	xor.b32  	%r349, %r341, %r348;
	shl.b32 	%r350, %r752, 2;
	xor.b32  	%r351, %r350, %r348;
	cvt.u64.u32 	%rd102, %r349;
	cvt.u64.u32 	%rd103, %r351;
	bfi.b64 	%rd104, %rd102, %rd103, 32, 32;
	cvt.rn.f64.s64 	%fd5, %rd104;
	mul.f64 	%fd6, %fd5, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f568, %fd6;
	setp.eq.s32 	%p42, %r347, 0;
	neg.f32 	%f569, %f568;
	selp.f32 	%f1402, %f568, %f569, %p42;

$L__BB0_42:
	add.s32 	%r60, %r753, 1;
	and.b32  	%r61, %r60, 1;
	setp.eq.s32 	%p43, %r61, 0;
	selp.f32 	%f112, %f1402, 0f3F800000, %p43;
	mul.rn.f32 	%f113, %f1402, %f1402;
	mov.f32 	%f1403, 0fB94D4153;
	@%p43 bra 	$L__BB0_44;

	mov.f32 	%f572, 0fBAB607ED;
	mov.f32 	%f573, 0f37CBAC00;
	fma.rn.f32 	%f1403, %f573, %f113, %f572;

$L__BB0_44:
	selp.f32 	%f574, 0f3C0885E4, 0f3D2AAABB, %p43;
	fma.rn.f32 	%f575, %f1403, %f113, %f574;
	selp.f32 	%f576, 0fBE2AAAA8, 0fBEFFFFFF, %p43;
	fma.rn.f32 	%f577, %f575, %f113, %f576;
	mov.f32 	%f578, 0f00000000;
	fma.rn.f32 	%f579, %f113, %f112, %f578;
	fma.rn.f32 	%f1404, %f577, %f579, %f112;
	and.b32  	%r353, %r60, 2;
	setp.eq.s32 	%p45, %r353, 0;
	@%p45 bra 	$L__BB0_46;

	mov.f32 	%f581, 0fBF800000;
	fma.rn.f32 	%f1404, %f1404, %f581, %f578;

$L__BB0_46:
	@%p36 bra 	$L__BB0_54;

	setp.eq.f32 	%p47, %f108, 0f7F800000;
	@%p47 bra 	$L__BB0_53;
	bra.uni 	$L__BB0_48;

$L__BB0_53:
	mov.f32 	%f584, 0f00000000;
	mul.rn.f32 	%f1405, %f106, %f584;
	mov.u32 	%r757, 0;
	bra.uni 	$L__BB0_54;

$L__BB0_48:
	mov.b32 	%r62, %f106;
	bfe.u32 	%r355, %r62, 23, 8;
	add.s32 	%r63, %r355, -128;
	shl.b32 	%r356, %r62, 8;
	or.b32  	%r64, %r356, -2147483648;
	shr.u32 	%r65, %r63, 5;
	mov.u64 	%rd172, 0;
	mov.u32 	%r754, 0;
	mov.u64 	%rd171, __cudart_i2opi_f;
	mov.u64 	%rd170, %rd1;

$L__BB0_49:
	.pragma "nounroll";
	ld.global.nc.u32 	%r357, [%rd171];
	mad.wide.u32 	%rd107, %r357, %r64, %rd172;
	shr.u64 	%rd172, %rd107, 32;
	st.local.u32 	[%rd170], %rd107;
	add.s64 	%rd171, %rd171, 4;
	add.s64 	%rd170, %rd170, 4;
	add.s32 	%r754, %r754, 1;
	setp.ne.s32 	%p48, %r754, 6;
	@%p48 bra 	$L__BB0_49;

	st.local.u32 	[%rd1+24], %rd172;
	mov.u32 	%r358, 4;
	sub.s32 	%r68, %r358, %r65;
	mov.u32 	%r359, 6;
	sub.s32 	%r360, %r359, %r65;
	mul.wide.s32 	%rd108, %r360, 4;
	add.s64 	%rd109, %rd1, %rd108;
	ld.local.u32 	%r755, [%rd109];
	ld.local.u32 	%r756, [%rd109+-4];
	and.b32  	%r71, %r63, 31;
	setp.eq.s32 	%p49, %r71, 0;
	@%p49 bra 	$L__BB0_52;

	mov.u32 	%r361, 32;
	sub.s32 	%r362, %r361, %r71;
	shr.u32 	%r363, %r756, %r362;
	shl.b32 	%r364, %r755, %r71;
	add.s32 	%r755, %r363, %r364;
	mul.wide.s32 	%rd110, %r68, 4;
	add.s64 	%rd111, %rd1, %rd110;
	ld.local.u32 	%r365, [%rd111];
	shr.u32 	%r366, %r365, %r362;
	shl.b32 	%r367, %r756, %r71;
	add.s32 	%r756, %r366, %r367;

$L__BB0_52:
	and.b32  	%r368, %r62, -2147483648;
	shr.u32 	%r369, %r756, 30;
	shl.b32 	%r370, %r755, 2;
	or.b32  	%r371, %r369, %r370;
	shr.u32 	%r372, %r371, 31;
	shr.u32 	%r373, %r755, 30;
	add.s32 	%r374, %r372, %r373;
	neg.s32 	%r375, %r374;
	setp.eq.s32 	%p50, %r368, 0;
	selp.b32 	%r757, %r374, %r375, %p50;
	setp.ne.s32 	%p51, %r372, 0;
	xor.b32  	%r376, %r368, -2147483648;
	selp.b32 	%r377, %r376, %r368, %p51;
	selp.b32 	%r378, -1, 0, %p51;
	xor.b32  	%r379, %r371, %r378;
	shl.b32 	%r380, %r756, 2;
	xor.b32  	%r381, %r380, %r378;
	cvt.u64.u32 	%rd112, %r379;
	cvt.u64.u32 	%rd113, %r381;
	bfi.b64 	%rd114, %rd112, %rd113, 32, 32;
	cvt.rn.f64.s64 	%fd7, %rd114;
	mul.f64 	%fd8, %fd7, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f582, %fd8;
	setp.eq.s32 	%p52, %r377, 0;
	neg.f32 	%f583, %f582;
	selp.f32 	%f1405, %f582, %f583, %p52;

$L__BB0_54:
	mul.f32 	%f122, %f105, %f1404;
	and.b32  	%r78, %r757, 1;
	setp.eq.s32 	%p53, %r78, 0;
	selp.f32 	%f123, %f1405, 0f3F800000, %p53;
	mul.rn.f32 	%f124, %f1405, %f1405;
	mov.f32 	%f1406, 0fB94D4153;
	@%p53 bra 	$L__BB0_56;

	mov.f32 	%f586, 0fBAB607ED;
	mov.f32 	%f587, 0f37CBAC00;
	fma.rn.f32 	%f1406, %f587, %f124, %f586;

$L__BB0_56:
	selp.f32 	%f588, 0f3C0885E4, 0f3D2AAABB, %p53;
	fma.rn.f32 	%f589, %f1406, %f124, %f588;
	selp.f32 	%f590, 0fBE2AAAA8, 0fBEFFFFFF, %p53;
	fma.rn.f32 	%f591, %f589, %f124, %f590;
	mov.f32 	%f1414, 0f00000000;
	fma.rn.f32 	%f593, %f124, %f123, %f1414;
	fma.rn.f32 	%f1407, %f591, %f593, %f123;
	and.b32  	%r383, %r757, 2;
	setp.eq.s32 	%p55, %r383, 0;
	@%p55 bra 	$L__BB0_58;

	mov.f32 	%f594, 0f00000000;
	mov.f32 	%f595, 0fBF800000;
	fma.rn.f32 	%f1407, %f1407, %f595, %f594;

$L__BB0_58:
	mul.f32 	%f599, %f122, %f122;
	mov.f32 	%f1408, 0f3F800000;
	sub.f32 	%f601, %f1408, %f599;
	mul.f32 	%f602, %f105, %f1407;
	mul.f32 	%f603, %f602, %f602;
	sub.f32 	%f604, %f601, %f603;
	max.f32 	%f605, %f1414, %f604;
	sqrt.rn.f32 	%f606, %f605;
	mul.f32 	%f607, %f102, %f602;
	mul.f32 	%f608, %f103, %f602;
	mul.f32 	%f609, %f104, %f602;
	mul.f32 	%f610, %f1391, %f103;
	mul.f32 	%f611, %f1390, %f104;
	sub.f32 	%f612, %f610, %f611;
	fma.rn.f32 	%f613, %f612, %f122, %f607;
	mul.f32 	%f614, %f1389, %f104;
	mul.f32 	%f615, %f1391, %f102;
	sub.f32 	%f616, %f614, %f615;
	fma.rn.f32 	%f617, %f616, %f122, %f608;
	mul.f32 	%f618, %f1390, %f102;
	mul.f32 	%f619, %f1389, %f103;
	sub.f32 	%f620, %f618, %f619;
	fma.rn.f32 	%f621, %f620, %f122, %f609;
	fma.rn.f32 	%f130, %f1389, %f606, %f613;
	fma.rn.f32 	%f131, %f1390, %f606, %f617;
	fma.rn.f32 	%f132, %f1391, %f606, %f621;
	setp.leu.f32 	%p56, %f131, 0f00000000;
	setp.neu.f32 	%p57, %f545, 0f00000000;
	and.pred  	%p58, %p57, %p56;
	mov.f32 	%f1415, %f1414;
	mov.f32 	%f1416, %f1414;
	@%p58 bra 	$L__BB0_62;

	mul.f32 	%f634, %f70, 0f3456BF95;
	abs.f32 	%f635, %f634;
	mul.f32 	%f636, %f71, 0f3456BF95;
	abs.f32 	%f637, %f636;
	mul.f32 	%f638, %f72, 0f3456BF95;
	abs.f32 	%f639, %f638;
	max.f32 	%f640, %f635, %f637;
	max.f32 	%f641, %f640, %f639;
	mov.f32 	%f642, 0f38D1B717;
	max.f32 	%f628, %f641, %f642;
	ld.const.u64 	%rd115, [params+64];
	mov.f32 	%f629, 0f6C4ECB8F;
	mov.f32 	%f630, 0f00000000;
	mov.u32 	%r420, 2;
	mov.u32 	%r421, 1;
	mov.u32 	%r422, 3;
	mov.u32 	%r425, 1065353216;
	mov.u32 	%r454, 0;
	// begin inline asm
	call(%r384,%r385,%r386,%r387,%r388,%r389,%r390,%r391,%r392,%r393,%r394,%r395,%r396,%r397,%r398,%r399,%r400,%r401,%r402,%r403,%r404,%r405,%r406,%r407,%r408,%r409,%r410,%r411,%r412,%r413,%r414,%r415),_optix_trace_typed_32,(%r454,%rd115,%f70,%f71,%f72,%f130,%f131,%f132,%f628,%f629,%f630,%r421,%r454,%r421,%r420,%r421,%r422,%r425,%r425,%r425,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454);
	// end inline asm
	setp.leu.f32 	%p59, %f542, 0f00000000;
	mov.f32 	%f1409, %f1408;
	mov.f32 	%f1410, %f1408;
	@%p59 bra 	$L__BB0_61;

	neg.f32 	%f643, %f132;
	neg.f32 	%f644, %f130;
	neg.f32 	%f645, %f131;
	tex.cube.v4.f32.f32 	{%f1410, %f1409, %f1408, %f646}, [%rd17, {%f643, %f645, %f644, %f644}];

$L__BB0_61:
	mov.b32 	%f647, %r384;
	fma.rn.f32 	%f1414, %f1410, %f647, 0f00000000;
	mov.b32 	%f648, %r385;
	fma.rn.f32 	%f1415, %f1409, %f648, 0f00000000;
	mov.b32 	%f649, %r386;
	fma.rn.f32 	%f1416, %f1408, %f649, 0f00000000;

$L__BB0_62:
	@%p32 bra 	$L__BB0_64;

	add.f32 	%f650, %f541, 0fBF800000;
	mul.f32 	%f651, %f650, 0f42C80000;
	mul.f32 	%f1414, %f651, %f1414;
	mul.f32 	%f1415, %f651, %f1415;
	mul.f32 	%f1416, %f651, %f1416;

$L__BB0_64:
	mul.f32 	%f652, %f546, %f1414;
	mul.f32 	%f1459, %f652, %f91;
	mul.f32 	%f653, %f547, %f1415;
	mul.f32 	%f1460, %f653, %f91;
	mul.f32 	%f654, %f548, %f1416;
	mul.f32 	%f1461, %f654, %f91;
	bra.uni 	$L__BB0_96;

// Wide-multiply argument reduction for the f32 value in %f172.
// The significand of %f172 is multiplied by the six 32-bit words of the
// __cudart_i2opi_f table (presumably bits of 2/pi, going by the table name --
// confirm against the CUDA math library), and the product is reduced to:
//   %r761  - signed quadrant count
//   %f1421 - reduced argument as f32
$L__BB0_71:
	// %r113 = biased exponent - 128; %r114 = significand shifted to the top of
	// the word with bit 31 forced on; %r115 = %r113 / 32 (word offset).
	mov.b32 	%r112, %f172;
	bfe.u32 	%r456, %r112, 23, 8;
	add.s32 	%r113, %r456, -128;
	shl.b32 	%r457, %r112, 8;
	or.b32  	%r114, %r457, -2147483648;
	shr.u32 	%r115, %r113, 5;
	// %rd175 = running carry, %r758 = loop counter, %rd174 = table cursor,
	// %rd173 = cursor into the local scratch array based at %rd1.
	mov.u64 	%rd175, 0;
	mov.u32 	%r758, 0;
	mov.u64 	%rd174, __cudart_i2opi_f;
	mov.u64 	%rd173, %rd1;

// Six iterations of 32x32->64 multiply-accumulate: the low 32 bits of each
// partial product are stored to scratch, the high 32 bits carry into the next.
$L__BB0_72:
	.pragma "nounroll";
	ld.global.nc.u32 	%r458, [%rd174];
	mad.wide.u32 	%rd118, %r458, %r114, %rd175;
	shr.u64 	%rd175, %rd118, 32;
	st.local.u32 	[%rd173], %rd118;
	add.s64 	%rd174, %rd174, 4;
	add.s64 	%rd173, %rd173, 4;
	add.s32 	%r758, %r758, 1;
	setp.ne.s32 	%p72, %r758, 6;
	@%p72 bra 	$L__BB0_72;

	// Final carry becomes the seventh scratch word (byte offset 24).
	st.local.u32 	[%rd1+24], %rd175;
	// Pick the two product words at indices (6 - %r115) and (5 - %r115).
	mov.u32 	%r459, 4;
	sub.s32 	%r118, %r459, %r115;
	mov.u32 	%r460, 6;
	sub.s32 	%r461, %r460, %r115;
	mul.wide.s32 	%rd119, %r461, 4;
	add.s64 	%rd120, %rd1, %rd119;
	ld.local.u32 	%r759, [%rd120];
	ld.local.u32 	%r760, [%rd120+-4];
	// %r121 = residual bit shift (exponent mod 32); zero means no realignment.
	and.b32  	%r121, %r113, 31;
	setp.eq.s32 	%p73, %r121, 0;
	@%p73 bra 	$L__BB0_75;

	// Shift the (hi, lo) pair left by %r121 bits, pulling the vacated low bits
	// from the next lower word at index (4 - %r115).
	mov.u32 	%r462, 32;
	sub.s32 	%r463, %r462, %r121;
	shr.u32 	%r464, %r760, %r463;
	shl.b32 	%r465, %r759, %r121;
	add.s32 	%r759, %r464, %r465;
	mul.wide.s32 	%rd121, %r118, 4;
	add.s64 	%rd122, %rd1, %rd121;
	ld.local.u32 	%r466, [%rd122];
	shr.u32 	%r467, %r466, %r463;
	shl.b32 	%r468, %r760, %r121;
	add.s32 	%r760, %r467, %r468;

$L__BB0_75:
	// %r469 = sign bit of the input. The top two bits of %r759 are the integer
	// part; %r472 holds the following 32 fraction bits and %r473 is its top bit.
	and.b32  	%r469, %r112, -2147483648;
	shr.u32 	%r470, %r760, 30;
	shl.b32 	%r471, %r759, 2;
	or.b32  	%r472, %r470, %r471;
	shr.u32 	%r473, %r472, 31;
	shr.u32 	%r474, %r759, 30;
	// Quadrant = integer part + top fraction bit, negated for negative inputs.
	add.s32 	%r475, %r473, %r474;
	neg.s32 	%r476, %r475;
	setp.eq.s32 	%p74, %r469, 0;
	selp.b32 	%r761, %r475, %r476, %p74;
	// When the top fraction bit is set, the fraction is bitwise complemented and
	// the result sign is flipped.
	setp.ne.s32 	%p75, %r473, 0;
	xor.b32  	%r477, %r469, -2147483648;
	selp.b32 	%r478, %r477, %r469, %p75;
	selp.b32 	%r479, -1, 0, %p75;
	xor.b32  	%r480, %r472, %r479;
	shl.b32 	%r481, %r760, 2;
	xor.b32  	%r482, %r481, %r479;
	// Pack (%r480 : %r482) into one 64-bit value, convert it as a signed integer
	// to f64 and scale by 0d3BF921FB54442D19 (approximately (pi/2) * 2^-64).
	cvt.u64.u32 	%rd123, %r480;
	cvt.u64.u32 	%rd124, %r482;
	bfi.b64 	%rd125, %rd123, %rd124, 32, 32;
	cvt.rn.f64.s64 	%fd9, %rd125;
	mul.f64 	%fd10, %fd9, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f744, %fd10;
	// Apply the sign chosen above.
	setp.eq.s32 	%p76, %r478, 0;
	neg.f32 	%f745, %f744;
	selp.f32 	%f1421, %f744, %f745, %p76;

// Polynomial evaluation on the reduced argument %f1421, selected by the
// quadrant count %r761 (both set by whichever path reaches this label).
// The result is left in %f1423.
// NOTE(review): the "+1" on the quadrant makes this look like a cosine
// evaluation sharing sine/cosine kernels -- confirm against the source kernel.
$L__BB0_77:
	// %r128 = quadrant + 1. %p77 is true when bit 0 of %r128 is clear.
	add.s32 	%r128, %r761, 1;
	and.b32  	%r129, %r128, 1;
	setp.eq.s32 	%p77, %r129, 0;
	// Base term: x when %p77 is true, otherwise 1.0.  %f179 = x*x.
	selp.f32 	%f178, %f1421, 0f3F800000, %p77;
	mul.rn.f32 	%f179, %f1421, %f1421;
	// Leading coefficient for the %p77 == true polynomial.
	mov.f32 	%f1422, 0fB94D4153;
	@%p77 bra 	$L__BB0_79;

	// %p77 == false: this polynomial has one extra leading term.
	mov.f32 	%f748, 0fBAB607ED;
	mov.f32 	%f749, 0f37CBAC00;
	fma.rn.f32 	%f1422, %f749, %f179, %f748;

$L__BB0_79:
	// Horner steps with per-branch coefficients; the last ones are about -1/6
	// (0fBE2AAAA8) when %p77 is true and about -0.5 (0fBEFFFFFF) otherwise.
	selp.f32 	%f750, 0f3C0885E4, 0f3D2AAABB, %p77;
	fma.rn.f32 	%f751, %f1422, %f179, %f750;
	selp.f32 	%f752, 0fBE2AAAA8, 0fBEFFFFFF, %p77;
	fma.rn.f32 	%f753, %f751, %f179, %f752;
	// result = base + (x*x * base) * P(x*x):
	//   %p77 true  -> x + x^3 * P(x^2)
	//   %p77 false -> 1 + x^2 * Q(x^2)
	mov.f32 	%f754, 0f00000000;
	fma.rn.f32 	%f755, %f179, %f178, %f754;
	fma.rn.f32 	%f1423, %f753, %f755, %f178;
	// Bit 1 of %r128 selects negation of the result.
	and.b32  	%r484, %r128, 2;
	setp.eq.s32 	%p79, %r484, 0;
	@%p79 bra 	$L__BB0_81;

	// Negate via result * -1.0 + 0.0.
	mov.f32 	%f757, 0fBF800000;
	fma.rn.f32 	%f1423, %f1423, %f757, %f754;

$L__BB0_81:
	@%p70 bra 	$L__BB0_89;

	setp.eq.f32 	%p81, %f174, 0f7F800000;
	@%p81 bra 	$L__BB0_88;
	bra.uni 	$L__BB0_83;

$L__BB0_88:
	mov.f32 	%f760, 0f00000000;
	mul.rn.f32 	%f1424, %f172, %f760;
	mov.u32 	%r765, 0;
	bra.uni 	$L__BB0_89;

$L__BB0_83:
	mov.b32 	%r130, %f172;
	bfe.u32 	%r486, %r130, 23, 8;
	add.s32 	%r131, %r486, -128;
	shl.b32 	%r487, %r130, 8;
	or.b32  	%r132, %r487, -2147483648;
	shr.u32 	%r133, %r131, 5;
	mov.u64 	%rd178, 0;
	mov.u32 	%r762, 0;
	mov.u64 	%rd177, __cudart_i2opi_f;
	mov.u64 	%rd176, %rd1;

$L__BB0_84:
	.pragma "nounroll";
	ld.global.nc.u32 	%r488, [%rd177];
	mad.wide.u32 	%rd128, %r488, %r132, %rd178;
	shr.u64 	%rd178, %rd128, 32;
	st.local.u32 	[%rd176], %rd128;
	add.s64 	%rd177, %rd177, 4;
	add.s64 	%rd176, %rd176, 4;
	add.s32 	%r762, %r762, 1;
	setp.ne.s32 	%p82, %r762, 6;
	@%p82 bra 	$L__BB0_84;

	st.local.u32 	[%rd1+24], %rd178;
	mov.u32 	%r489, 4;
	sub.s32 	%r136, %r489, %r133;
	mov.u32 	%r490, 6;
	sub.s32 	%r491, %r490, %r133;
	mul.wide.s32 	%rd129, %r491, 4;
	add.s64 	%rd130, %rd1, %rd129;
	ld.local.u32 	%r763, [%rd130];
	ld.local.u32 	%r764, [%rd130+-4];
	and.b32  	%r139, %r131, 31;
	setp.eq.s32 	%p83, %r139, 0;
	@%p83 bra 	$L__BB0_87;

	mov.u32 	%r492, 32;
	sub.s32 	%r493, %r492, %r139;
	shr.u32 	%r494, %r764, %r493;
	shl.b32 	%r495, %r763, %r139;
	add.s32 	%r763, %r494, %r495;
	mul.wide.s32 	%rd131, %r136, 4;
	add.s64 	%rd132, %rd1, %rd131;
	ld.local.u32 	%r496, [%rd132];
	shr.u32 	%r497, %r496, %r493;
	shl.b32 	%r498, %r764, %r139;
	add.s32 	%r764, %r497, %r498;

$L__BB0_87:
	and.b32  	%r499, %r130, -2147483648;
	shr.u32 	%r500, %r764, 30;
	shl.b32 	%r501, %r763, 2;
	or.b32  	%r502, %r500, %r501;
	shr.u32 	%r503, %r502, 31;
	shr.u32 	%r504, %r763, 30;
	add.s32 	%r505, %r503, %r504;
	neg.s32 	%r506, %r505;
	setp.eq.s32 	%p84, %r499, 0;
	selp.b32 	%r765, %r505, %r506, %p84;
	setp.ne.s32 	%p85, %r503, 0;
	xor.b32  	%r507, %r499, -2147483648;
	selp.b32 	%r508, %r507, %r499, %p85;
	selp.b32 	%r509, -1, 0, %p85;
	xor.b32  	%r510, %r502, %r509;
	shl.b32 	%r511, %r764, 2;
	xor.b32  	%r512, %r511, %r509;
	cvt.u64.u32 	%rd133, %r510;
	cvt.u64.u32 	%rd134, %r512;
	bfi.b64 	%rd135, %rd133, %rd134, 32, 32;
	cvt.rn.f64.s64 	%fd11, %rd135;
	mul.f64 	%fd12, %fd11, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f758, %fd12;
	setp.eq.s32 	%p86, %r508, 0;
	neg.f32 	%f759, %f758;
	selp.f32 	%f1424, %f758, %f759, %p86;

$L__BB0_89:
	mul.f32 	%f188, %f171, %f1423;
	and.b32  	%r146, %r765, 1;
	setp.eq.s32 	%p87, %r146, 0;
	selp.f32 	%f189, %f1424, 0f3F800000, %p87;
	mul.rn.f32 	%f190, %f1424, %f1424;
	mov.f32 	%f1425, 0fB94D4153;
	@%p87 bra 	$L__BB0_91;

	mov.f32 	%f762, 0fBAB607ED;
	mov.f32 	%f763, 0f37CBAC00;
	fma.rn.f32 	%f1425, %f763, %f190, %f762;

$L__BB0_91:
	selp.f32 	%f764, 0f3C0885E4, 0f3D2AAABB, %p87;
	fma.rn.f32 	%f765, %f1425, %f190, %f764;
	selp.f32 	%f766, 0fBE2AAAA8, 0fBEFFFFFF, %p87;
	fma.rn.f32 	%f767, %f765, %f190, %f766;
	mov.f32 	%f768, 0f00000000;
	fma.rn.f32 	%f769, %f190, %f189, %f768;
	fma.rn.f32 	%f1426, %f767, %f769, %f189;
	and.b32  	%r514, %r765, 2;
	setp.eq.s32 	%p89, %r514, 0;
	@%p89 bra 	$L__BB0_93;

	mov.f32 	%f771, 0fBF800000;
	fma.rn.f32 	%f1426, %f1426, %f771, %f768;

$L__BB0_93:
	mul.f32 	%f781, %f188, %f188;
	mov.f32 	%f782, 0f3F800000;
	sub.f32 	%f783, %f782, %f781;
	mul.f32 	%f784, %f171, %f1426;
	mul.f32 	%f785, %f784, %f784;
	sub.f32 	%f786, %f783, %f785;
	max.f32 	%f787, %f768, %f786;
	sqrt.rn.f32 	%f788, %f787;
	mul.f32 	%f789, %f168, %f784;
	mul.f32 	%f790, %f169, %f784;
	mul.f32 	%f791, %f170, %f784;
	mul.f32 	%f792, %f155, %f170;
	mul.f32 	%f793, %f156, %f169;
	sub.f32 	%f794, %f793, %f792;
	fma.rn.f32 	%f795, %f794, %f188, %f789;
	mul.f32 	%f796, %f156, %f168;
	mul.f32 	%f797, %f154, %f170;
	sub.f32 	%f798, %f797, %f796;
	fma.rn.f32 	%f799, %f798, %f188, %f790;
	mul.f32 	%f800, %f154, %f169;
	mul.f32 	%f801, %f155, %f168;
	sub.f32 	%f802, %f801, %f800;
	fma.rn.f32 	%f803, %f802, %f188, %f791;
	fma.rn.f32 	%f804, %f154, %f788, %f795;
	fma.rn.f32 	%f805, %f155, %f788, %f799;
	fma.rn.f32 	%f806, %f156, %f788, %f803;
	add.f32 	%f807, %f154, %f804;
	add.f32 	%f808, %f155, %f805;
	add.f32 	%f809, %f156, %f806;
	mul.f32 	%f810, %f545, %f807;
	mul.f32 	%f811, %f545, %f808;
	mul.f32 	%f812, %f545, %f809;
	sub.f32 	%f813, %f810, %f154;
	sub.f32 	%f814, %f811, %f155;
	sub.f32 	%f815, %f812, %f156;
	mul.f32 	%f816, %f814, %f814;
	fma.rn.f32 	%f817, %f813, %f813, %f816;
	fma.rn.f32 	%f818, %f815, %f815, %f817;
	sqrt.rn.f32 	%f819, %f818;
	rcp.rn.f32 	%f820, %f819;
	mul.f32 	%f775, %f820, %f813;
	mul.f32 	%f776, %f820, %f814;
	mul.f32 	%f777, %f820, %f815;
	mul.f32 	%f821, %f70, 0f3456BF95;
	abs.f32 	%f822, %f821;
	mul.f32 	%f823, %f71, 0f3456BF95;
	abs.f32 	%f824, %f823;
	mul.f32 	%f825, %f72, 0f3456BF95;
	abs.f32 	%f826, %f825;
	max.f32 	%f827, %f822, %f824;
	max.f32 	%f828, %f827, %f826;
	mov.f32 	%f829, 0f38D1B717;
	max.f32 	%f778, %f828, %f829;
	ld.const.u64 	%rd136, [params+64];
	mov.f32 	%f779, 0f6C4ECB8F;
	mov.u32 	%r551, 2;
	mov.u32 	%r552, 1;
	mov.u32 	%r553, 3;
	mov.u32 	%r556, 1065353216;
	mov.u32 	%r585, 0;
	// begin inline asm
	call(%r515,%r516,%r517,%r518,%r519,%r520,%r521,%r522,%r523,%r524,%r525,%r526,%r527,%r528,%r529,%r530,%r531,%r532,%r533,%r534,%r535,%r536,%r537,%r538,%r539,%r540,%r541,%r542,%r543,%r544,%r545,%r546),_optix_trace_typed_32,(%r585,%rd136,%f70,%f71,%f72,%f775,%f776,%f777,%f778,%f779,%f768,%r552,%r585,%r552,%r551,%r552,%r553,%r556,%r556,%r556,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585);
	// end inline asm
	mov.b32 	%f1427, %r515;
	mov.b32 	%f1428, %r516;
	mov.b32 	%f1429, %r517;

$L__BB0_94:
	mul.f32 	%f830, %f541, 0f42C80000;
	mul.f32 	%f831, %f159, %f1427;
	mul.f32 	%f832, %f830, %f831;
	mul.f32 	%f833, %f159, %f1428;
	mul.f32 	%f834, %f830, %f833;
	mul.f32 	%f835, %f159, %f1429;
	mul.f32 	%f836, %f830, %f835;
	setp.gt.s32 	%p90, %r5, 0;
	selp.f32 	%f837, %f832, %f831, %p90;
	selp.f32 	%f838, %f834, %f833, %p90;
	selp.f32 	%f839, %f836, %f835, %p90;
	mul.f32 	%f840, %f546, %f1417;
	mul.f32 	%f841, %f547, %f1418;
	mul.f32 	%f842, %f548, %f1419;
	mul.f32 	%f1432, %f842, %f839;
	mul.f32 	%f1431, %f841, %f838;
	mul.f32 	%f1430, %f840, %f837;

$L__BB0_95:
	mul.f32 	%f1459, %f1430, %f91;
	mul.f32 	%f1460, %f1431, %f91;
	mul.f32 	%f1461, %f1432, %f91;

// Gate for the section that follows: it is skipped (branch to $L__BB0_126)
// when the 32-bit field at params+204 is zero, or when the second component
// of the cube-texture lookup below is zero.
$L__BB0_96:
	ld.const.u32 	%r586, [params+204];
	setp.eq.s32 	%p91, %r586, 0;
	// %rs16 is cleared here and tested later at $L__BB0_128.
	mov.u16 	%rs16, 0;
	@%p91 bra 	$L__BB0_126;

	// Lookup direction = (%f70, %f71, %f72) minus the three floats stored at
	// params+308, +312 and +316.
	ld.const.f32 	%f843, [params+308];
	sub.f32 	%f844, %f70, %f843;
	ld.const.v2.f32 	{%f845, %f846}, [params+312];
	sub.f32 	%f849, %f71, %f845;
	sub.f32 	%f850, %f72, %f846;
	// Cube-map fetch returning four unsigned integers from the texture object
	// whose handle is stored at params+232. The fourth coordinate repeats the
	// third.
	// NOTE(review): the code after this block uses %r147 as a base index and
	// %r148 as an element count -- presumably a per-cell light list; confirm.
	ld.const.u64 	%rd137, [params+232];
	tex.cube.v4.u32.f32 	{%r147, %r148, %r149, %r150}, [%rd137, {%f844, %f849, %f850, %f850}];
	setp.eq.s32 	%p92, %r148, 0;
	@%p92 bra 	$L__BB0_126;

	cvt.rn.f32.u32 	%f214, %r148;
	mul.f32 	%f852, %f3, %f214;
	cvt.rzi.u32.f32 	%r587, %f852;
	add.s32 	%r588, %r148, -1;
	min.u32 	%r589, %r587, %r588;
	add.s32 	%r590, %r589, %r147;
	ld.const.u64 	%rd138, [params+240];
	cvta.to.global.u64 	%rd139, %rd138;
	mul.wide.s32 	%rd140, %r590, 4;
	add.s64 	%rd141, %rd139, %rd140;
	ld.const.u64 	%rd142, [params+216];
	cvta.to.global.u64 	%rd143, %rd142;
	ld.global.u32 	%r591, [%rd141];
	mul.wide.u32 	%rd144, %r591, 112;
	add.s64 	%rd145, %rd143, %rd144;
	ld.global.v4.f32 	{%f853, %f854, %f855, %f856}, [%rd145];
	ld.global.v4.f32 	{%f857, %f858, %f859, %f860}, [%rd145+16];
	ld.global.v4.f32 	{%f1443, %f1444, %f1445, %f866}, [%rd145+32];
	ld.global.v4.f32 	{%f867, %f868, %f869, %f1442}, [%rd145+48];
	ld.global.v4.f32 	{%f871, %f872, %f873, %f874}, [%rd145+64];
	ld.global.v4.u32 	{%r592, %r593, %r594, %r595}, [%rd145+80];
	mov.b32 	%f233, %r592;
	mov.b32 	%f234, %r593;
	mov.b32 	%f235, %r594;
	ld.global.u64 	%rd42, [%rd145+96];
	sub.f32 	%f236, %f854, %f70;
	sub.f32 	%f237, %f855, %f71;
	sub.f32 	%f238, %f856, %f72;
	mul.f32 	%f875, %f237, %f237;
	fma.rn.f32 	%f876, %f236, %f236, %f875;
	fma.rn.f32 	%f877, %f238, %f238, %f876;
	sqrt.rn.f32 	%f878, %f877;
	rcp.rn.f32 	%f879, %f878;
	mul.f32 	%f1439, %f236, %f879;
	mul.f32 	%f1440, %f237, %f879;
	mul.f32 	%f1441, %f238, %f879;
	mul.f32 	%f242, %f878, %f858;
	mul.f32 	%f243, %f878, %f860;
	mov.f32 	%f883, 0f40800000;
	abs.f32 	%f245, %f243;
	setp.lt.f32 	%p93, %f245, 0f00800000;
	mul.f32 	%f885, %f245, 0f4B800000;
	selp.f32 	%f886, %f885, %f245, %p93;
	selp.f32 	%f887, 0fC3170000, 0fC2FE0000, %p93;
	mov.b32 	%r599, %f886;
	and.b32  	%r600, %r599, 8388607;
	or.b32  	%r601, %r600, 1065353216;
	mov.b32 	%f888, %r601;
	shr.u32 	%r602, %r599, 23;
	cvt.rn.f32.u32 	%f889, %r602;
	add.f32 	%f890, %f887, %f889;
	setp.gt.f32 	%p94, %f888, 0f3FB504F3;
	mul.f32 	%f891, %f888, 0f3F000000;
	add.f32 	%f892, %f890, 0f3F800000;
	selp.f32 	%f893, %f892, %f890, %p94;
	selp.f32 	%f894, %f891, %f888, %p94;
	add.f32 	%f895, %f894, 0fBF800000;
	add.f32 	%f896, %f894, 0f3F800000;
	rcp.approx.ftz.f32 	%f897, %f896;
	add.f32 	%f898, %f895, %f895;
	mul.f32 	%f899, %f898, %f897;
	mul.f32 	%f900, %f899, %f899;
	mov.f32 	%f901, 0f3C4CAF63;
	mov.f32 	%f902, 0f3B18F0FE;
	fma.rn.f32 	%f903, %f902, %f900, %f901;
	mov.f32 	%f904, 0f3DAAAABD;
	fma.rn.f32 	%f905, %f903, %f900, %f904;
	mul.rn.f32 	%f906, %f905, %f900;
	mul.rn.f32 	%f907, %f906, %f899;
	sub.f32 	%f908, %f895, %f899;
	add.f32 	%f909, %f908, %f908;
	neg.f32 	%f910, %f899;
	fma.rn.f32 	%f911, %f910, %f895, %f909;
	mul.rn.f32 	%f912, %f897, %f911;
	add.f32 	%f913, %f907, %f899;
	sub.f32 	%f914, %f899, %f913;
	add.f32 	%f915, %f907, %f914;
	add.f32 	%f916, %f912, %f915;
	add.f32 	%f917, %f913, %f916;
	sub.f32 	%f918, %f913, %f917;
	add.f32 	%f919, %f916, %f918;
	mov.f32 	%f920, 0f3F317200;
	mul.rn.f32 	%f921, %f893, %f920;
	mov.f32 	%f922, 0f35BFBE8E;
	mul.rn.f32 	%f923, %f893, %f922;
	add.f32 	%f924, %f921, %f917;
	sub.f32 	%f925, %f921, %f924;
	add.f32 	%f926, %f917, %f925;
	add.f32 	%f927, %f919, %f926;
	add.f32 	%f928, %f923, %f927;
	add.f32 	%f929, %f924, %f928;
	sub.f32 	%f930, %f924, %f929;
	add.f32 	%f931, %f928, %f930;
	mul.rn.f32 	%f932, %f883, %f929;
	neg.f32 	%f933, %f932;
	fma.rn.f32 	%f934, %f883, %f929, %f933;
	fma.rn.f32 	%f935, %f883, %f931, %f934;
	mov.f32 	%f936, 0f00000000;
	fma.rn.f32 	%f937, %f936, %f929, %f935;
	add.rn.f32 	%f938, %f932, %f937;
	neg.f32 	%f939, %f938;
	add.rn.f32 	%f940, %f932, %f939;
	add.rn.f32 	%f941, %f940, %f937;
	mov.b32 	%r603, %f938;
	setp.eq.s32 	%p95, %r603, 1118925336;
	add.s32 	%r604, %r603, -1;
	mov.b32 	%f942, %r604;
	add.f32 	%f943, %f941, 0f37000000;
	selp.f32 	%f246, %f943, %f941, %p95;
	selp.f32 	%f944, %f942, %f938, %p95;
	mov.f32 	%f945, 0f3FB8AA3B;
	mul.rn.f32 	%f946, %f944, %f945;
	cvt.rzi.f32.f32 	%f947, %f946;
	abs.f32 	%f948, %f947;
	setp.gt.f32 	%p96, %f948, 0f42FC0000;
	mov.b32 	%r605, %f947;
	and.b32  	%r606, %r605, -2147483648;
	or.b32  	%r607, %r606, 1123811328;
	mov.b32 	%f949, %r607;
	selp.f32 	%f950, %f949, %f947, %p96;
	mov.f32 	%f951, 0fBF317218;
	fma.rn.f32 	%f952, %f950, %f951, %f944;
	mov.f32 	%f953, 0f3102E308;
	fma.rn.f32 	%f954, %f950, %f953, %f952;
	mul.f32 	%f955, %f954, 0f3FB8AA3B;
	add.f32 	%f956, %f950, 0f4B40007F;
	mov.b32 	%r608, %f956;
	shl.b32 	%r609, %r608, 23;
	mov.b32 	%f957, %r609;
	ex2.approx.ftz.f32 	%f958, %f955;
	mul.f32 	%f247, %f958, %f957;
	setp.eq.f32 	%p97, %f247, 0f7F800000;
	mov.f32 	%f1436, 0f7F800000;
	@%p97 bra 	$L__BB0_100;

	fma.rn.f32 	%f1436, %f247, %f246, %f247;

// Predicate setup for the special-case handling that follows, with the
// exponent constant 4.0 (0f40800000) and base %f243.
// NOTE(review): this matches the shape of an inlined powf(x, 4.0f)
// "is the exponent an odd integer" test -- confirm against the source kernel.
$L__BB0_100:
	// |4.0 - 2 * trunc(2.0)| = 0.0, so the comparison against 1.0 below is
	// always false: %p99 and therefore %p1 are constant-false on this path.
	mov.f32 	%f1370, 0f40000000;
	cvt.rzi.f32.f32 	%f1369, %f1370;
	add.f32 	%f1368, %f1369, %f1369;
	mov.f32 	%f1367, 0f40800000;
	sub.f32 	%f1366, %f1367, %f1368;
	abs.f32 	%f1365, %f1366;
	// %p98: base is negative.  %p1 = %p98 AND %p99.
	setp.lt.f32 	%p98, %f243, 0f00000000;
	setp.eq.f32 	%p99, %f1365, 0f3F800000;
	and.pred  	%p1, %p98, %p99;
	// A base of exactly zero goes to $L__BB0_104; everything else to $L__BB0_101.
	setp.eq.f32 	%p100, %f243, 0f00000000;
	@%p100 bra 	$L__BB0_104;
	bra.uni 	$L__BB0_101;

$L__BB0_104:
	add.f32 	%f963, %f243, %f243;
	selp.f32 	%f1438, %f963, 0f00000000, %p99;
	bra.uni 	$L__BB0_105;

$L__BB0_101:
	mov.b32 	%r610, %f1436;
	xor.b32  	%r611, %r610, -2147483648;
	mov.b32 	%f959, %r611;
	selp.f32 	%f1438, %f959, %f1436, %p1;
	setp.geu.f32 	%p101, %f243, 0f00000000;
	@%p101 bra 	$L__BB0_105;

	mov.f32 	%f960, 0f40800000;
	cvt.rzi.f32.f32 	%f961, %f960;
	setp.eq.f32 	%p102, %f961, 0f40800000;
	@%p102 bra 	$L__BB0_105;

	mov.f32 	%f1438, 0f7FFFFFFF;

$L__BB0_105:
	abs.f32 	%f1371, %f243;
	add.f32 	%f964, %f1371, 0f40800000;
	mov.b32 	%r612, %f964;
	setp.lt.s32 	%p104, %r612, 2139095040;
	@%p104 bra 	$L__BB0_110;

	abs.f32 	%f1375, %f243;
	setp.gtu.f32 	%p105, %f1375, 0f7F800000;
	@%p105 bra 	$L__BB0_109;
	bra.uni 	$L__BB0_107;

$L__BB0_109:
	add.f32 	%f1438, %f243, 0f40800000;
	bra.uni 	$L__BB0_110;

$L__BB0_107:
	abs.f32 	%f1376, %f243;
	setp.neu.f32 	%p106, %f1376, 0f7F800000;
	@%p106 bra 	$L__BB0_110;

	selp.f32 	%f1438, 0fFF800000, 0f7F800000, %p1;

$L__BB0_110:
	mov.f32 	%f965, 0f3F800000;
	sub.f32 	%f966, %f965, %f1438;
	setp.eq.f32 	%p107, %f243, 0f3F800000;
	selp.f32 	%f967, 0f00000000, %f966, %p107;
	cvt.sat.f32.f32 	%f968, %f967;
	fma.rn.f32 	%f969, %f242, %f242, %f859;
	div.rn.f32 	%f1446, %f968, %f969;
	mul.f32 	%f970, %f1390, %f1440;
	fma.rn.f32 	%f971, %f1389, %f1439, %f970;
	fma.rn.f32 	%f257, %f1391, %f1441, %f971;
	setp.eq.f32 	%p108, %f853, 0f3F800000;
	@%p108 bra 	$L__BB0_116;
	bra.uni 	$L__BB0_111;

$L__BB0_116:
	setp.eq.s64 	%p112, %rd42, 0;
	@%p112 bra 	$L__BB0_120;

	mul.f32 	%f994, %f233, %f1439;
	mul.f32 	%f995, %f234, %f1440;
	neg.f32 	%f996, %f995;
	sub.f32 	%f997, %f996, %f994;
	mul.f32 	%f998, %f235, %f1441;
	sub.f32 	%f262, %f997, %f998;
	setp.geu.f32 	%p113, %f1442, 0f00000000;
	@%p113 bra 	$L__BB0_119;

	sub.f32 	%f1374, %f856, %f72;
	sub.f32 	%f1373, %f854, %f70;
	sub.f32 	%f1372, %f855, %f71;
	mul.f32 	%f999, %f234, %f1372;
	fma.rn.f32 	%f1000, %f233, %f1373, %f999;
	fma.rn.f32 	%f1001, %f235, %f1374, %f1000;
	rcp.rn.f32 	%f1002, %f1001;
	mul.f32 	%f1439, %f1373, %f1002;
	mul.f32 	%f1440, %f1372, %f1002;
	mul.f32 	%f1441, %f1374, %f1002;
	neg.f32 	%f1442, %f1442;

$L__BB0_119:
	setp.gt.f32 	%p114, %f262, 0f00000000;
	selp.f32 	%f1003, 0f3F800000, 0f00000000, %p114;
	mov.f32 	%f1004, 0f3F800000;
	mul.f32 	%f1005, %f868, %f1440;
	fma.rn.f32 	%f1006, %f867, %f1439, %f1005;
	mul.f32 	%f1007, %f872, %f1440;
	fma.rn.f32 	%f1008, %f871, %f1439, %f1007;
	fma.rn.f32 	%f1009, %f869, %f1441, %f1006;
	fma.rn.f32 	%f1010, %f873, %f1441, %f1008;
	fma.rn.f32 	%f1011, %f1442, %f1009, 0f3F000000;
	sub.f32 	%f1012, %f1004, %f1011;
	fma.rn.f32 	%f1013, %f1442, %f1010, 0f3F000000;
	tex.2d.v4.f32.f32 	{%f1014, %f1015, %f1016, %f1017}, [%rd42, {%f1012, %f1013}];
	mul.f32 	%f1018, %f1003, %f1014;
	mul.f32 	%f1019, %f1003, %f1015;
	mul.f32 	%f1020, %f1003, %f1016;
	mul.f32 	%f1443, %f1443, %f1018;
	mul.f32 	%f1444, %f1444, %f1019;
	mul.f32 	%f1445, %f1445, %f1020;
	bra.uni 	$L__BB0_120;

$L__BB0_111:
	setp.eq.f32 	%p109, %f853, 0f40000000;
	@%p109 bra 	$L__BB0_114;
	bra.uni 	$L__BB0_112;

$L__BB0_114:
	setp.eq.s64 	%p111, %rd42, 0;
	@%p111 bra 	$L__BB0_120;

	mul.f32 	%f981, %f868, %f1440;
	fma.rn.f32 	%f982, %f867, %f1439, %f981;
	mul.f32 	%f983, %f872, %f1440;
	fma.rn.f32 	%f984, %f871, %f1439, %f983;
	mul.f32 	%f985, %f234, %f1440;
	fma.rn.f32 	%f986, %f233, %f1439, %f985;
	fma.rn.f32 	%f987, %f869, %f1441, %f982;
	fma.rn.f32 	%f988, %f873, %f1441, %f984;
	fma.rn.f32 	%f989, %f235, %f1441, %f986;
	tex.cube.v4.f32.f32 	{%f990, %f991, %f992, %f993}, [%rd42, {%f987, %f988, %f989, %f989}];
	mul.f32 	%f1443, %f1443, %f990;
	mul.f32 	%f1444, %f1444, %f991;
	mul.f32 	%f1445, %f1445, %f992;
	bra.uni 	$L__BB0_120;

$L__BB0_112:
	setp.neu.f32 	%p110, %f853, 0f40800000;
	@%p110 bra 	$L__BB0_120;

	mul.f32 	%f972, %f233, %f1439;
	mul.f32 	%f973, %f234, %f1440;
	neg.f32 	%f974, %f973;
	sub.f32 	%f975, %f974, %f972;
	mul.f32 	%f976, %f235, %f1441;
	sub.f32 	%f977, %f975, %f976;
	fma.rn.f32 	%f978, %f866, %f977, %f1442;
	cvt.sat.f32.f32 	%f979, %f978;
	mul.f32 	%f980, %f979, %f979;
	mul.f32 	%f1446, %f1446, %f980;

$L__BB0_120:
	max.f32 	%f1024, %f1443, %f1444;
	max.f32 	%f1025, %f1024, %f1445;
	cvt.sat.f32.f32 	%f1026, %f257;
	mul.f32 	%f278, %f1026, %f1446;
	mul.f32 	%f1027, %f278, %f1025;
	setp.lt.f32 	%p115, %f1027, 0f3727C5AC;
	mov.f32 	%f1450, 0f00000000;
	mov.f32 	%f1451, %f1450;
	mov.f32 	%f1452, %f1450;
	@%p115 bra 	$L__BB0_124;

	setp.lt.s32 	%p116, %r595, 1;
	mov.f32 	%f1447, 0f3F800000;
	mov.f32 	%f1448, %f1447;
	mov.f32 	%f1449, %f1447;
	@%p116 bra 	$L__BB0_123;

	fma.rn.f32 	%f1040, %f1, 0f40000000, 0fBF800000;
	fma.rn.f32 	%f1041, %f2, 0f40000000, 0fBF800000;
	fma.rn.f32 	%f1042, %f3, 0f40000000, 0fBF800000;
	fma.rn.f32 	%f1043, %f1040, %f857, %f854;
	fma.rn.f32 	%f1044, %f1041, %f857, %f855;
	fma.rn.f32 	%f1045, %f1042, %f857, %f856;
	sub.f32 	%f1046, %f1043, %f70;
	sub.f32 	%f1047, %f1044, %f71;
	sub.f32 	%f1048, %f1045, %f72;
	mul.f32 	%f1049, %f1047, %f1047;
	fma.rn.f32 	%f1050, %f1046, %f1046, %f1049;
	fma.rn.f32 	%f1051, %f1048, %f1048, %f1050;
	sqrt.rn.f32 	%f1038, %f1051;
	rcp.rn.f32 	%f1052, %f1038;
	mul.f32 	%f1034, %f1046, %f1052;
	mul.f32 	%f1035, %f1047, %f1052;
	mul.f32 	%f1036, %f1048, %f1052;
	mul.f32 	%f1053, %f70, 0f3456BF95;
	abs.f32 	%f1054, %f1053;
	mul.f32 	%f1055, %f71, 0f3456BF95;
	abs.f32 	%f1056, %f1055;
	mul.f32 	%f1057, %f72, 0f3456BF95;
	abs.f32 	%f1058, %f1057;
	max.f32 	%f1059, %f1054, %f1056;
	max.f32 	%f1060, %f1059, %f1058;
	mov.f32 	%f1061, 0f38D1B717;
	max.f32 	%f1037, %f1060, %f1061;
	ld.const.u64 	%rd146, [params+64];
	mov.f32 	%f1039, 0f00000000;
	mov.u32 	%r649, 2;
	mov.u32 	%r650, 1;
	mov.u32 	%r651, 3;
	mov.u32 	%r654, 1065353216;
	mov.u32 	%r683, 0;
	// begin inline asm
	call(%r613,%r614,%r615,%r616,%r617,%r618,%r619,%r620,%r621,%r622,%r623,%r624,%r625,%r626,%r627,%r628,%r629,%r630,%r631,%r632,%r633,%r634,%r635,%r636,%r637,%r638,%r639,%r640,%r641,%r642,%r643,%r644),_optix_trace_typed_32,(%r683,%rd146,%f70,%f71,%f72,%f1034,%f1035,%f1036,%f1037,%f1038,%f1039,%r650,%r683,%r650,%r649,%r650,%r651,%r654,%r654,%r654,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683);
	// end inline asm
	mov.b32 	%f1447, %r613;
	mov.b32 	%f1448, %r614;
	mov.b32 	%f1449, %r615;

$L__BB0_123:
	ld.const.u32 	%r740, [params+340];
	mul.f32 	%f1062, %f278, %f1447;
	mul.f32 	%f1063, %f874, %f1062;
	mul.f32 	%f1064, %f278, %f1448;
	mul.f32 	%f1065, %f874, %f1064;
	mul.f32 	%f1066, %f278, %f1449;
	mul.f32 	%f1067, %f874, %f1066;
	setp.gt.s32 	%p117, %r740, 0;
	selp.f32 	%f1068, %f1063, %f1062, %p117;
	selp.f32 	%f1069, %f1065, %f1064, %p117;
	selp.f32 	%f1070, %f1067, %f1066, %p117;
	mul.f32 	%f1452, %f1445, %f1070;
	mul.f32 	%f1451, %f1444, %f1069;
	mul.f32 	%f1450, %f1443, %f1068;

$L__BB0_124:
	mov.u16 	%rs16, 0;
	fma.rn.f32 	%f1459, %f1450, %f214, %f1459;
	fma.rn.f32 	%f1460, %f1451, %f214, %f1460;
	fma.rn.f32 	%f1461, %f1452, %f214, %f1461;

// Folds the contribution (%f1459, %f1460, %f1461) into the running result and
// computes the address of this launch index's element in the buffer whose
// pointer is stored at params+96.
$L__BB0_126:
	// %p176 is true when the 32-bit field at params+340 is zero.
	ld.const.u32 	%r741, [params+340];
	setp.eq.s32 	%p176, %r741, 0;
	// NaN filter: setp.le is an ordered compare, so |x| <= +inf is false only
	// for NaN. NaN components become 0.0; infinities pass through unchanged.
	abs.f32 	%f1080, %f1459;
	setp.le.f32 	%p119, %f1080, 0f7F800000;
	selp.f32 	%f1081, %f1459, 0f00000000, %p119;
	abs.f32 	%f1082, %f1460;
	setp.le.f32 	%p120, %f1082, 0f7F800000;
	selp.f32 	%f1083, %f1460, 0f00000000, %p120;
	abs.f32 	%f1084, %f1461;
	setp.le.f32 	%p121, %f1084, 0f7F800000;
	selp.f32 	%f1085, %f1461, 0f00000000, %p121;
	// result = (%f1456..%f1458) * filtered contribution + (%f1453..%f1455).
	fma.rn.f32 	%f1465, %f1456, %f1081, %f1453;
	fma.rn.f32 	%f1466, %f1457, %f1083, %f1454;
	fma.rn.f32 	%f1467, %f1458, %f1085, %f1455;
	// The three multipliers are also written out to the address in %rd15.
	st.global.f32 	[%rd15], %f1456;
	st.global.f32 	[%rd15+4], %f1457;
	st.global.f32 	[%rd15+8], %f1458;
	// %rd43 = base(params+96) + 12 * (stride(params+88) * launch_index_y
	//         + launch_index_x); each element is three f32 values.
	ld.const.u64 	%rd147, [params+96];
	cvta.to.global.u64 	%rd148, %rd147;
	ld.const.u32 	%r684, [params+88];
	mad.lo.s32 	%r685, %r684, %r156, %r155;
	mul.wide.u32 	%rd149, %r685, 12;
	add.s64 	%rd43, %rd148, %rd149;
	@%p176 bra 	$L__BB0_128;

	// params+340 != 0: add the values already stored in the buffer element.
	ld.global.f32 	%f1086, [%rd43];
	add.f32 	%f1465, %f1465, %f1086;
	ld.global.f32 	%f1087, [%rd43+4];
	add.f32 	%f1466, %f1466, %f1087;
	ld.global.f32 	%f1088, [%rd43+8];
	add.f32 	%f1467, %f1467, %f1088;
	bra.uni 	$L__BB0_133;

// Path taken when params+340 == 0. Under the conditions below, the result
// (%f1465..%f1467) is replaced -- not accumulated -- by a value built from a
// 64-byte record, optionally modulated by a cube-texture sample.
$L__BB0_128:
	// Keep the current result if %rs16 == 0 or the signed index at params+368
	// is negative.
	setp.eq.s16 	%p123, %rs16, 0;
	ld.const.u32 	%r153, [params+368];
	setp.lt.s32 	%p124, %r153, 0;
	or.pred  	%p125, %p123, %p124;
	@%p125 bra 	$L__BB0_133;

	// Record address = base(params+208) + 64 * index. Four floats are read at
	// byte offset 16 and a 64-bit handle at byte offset 48.
	ld.const.u64 	%rd150, [params+208];
	cvta.to.global.u64 	%rd151, %rd150;
	mul.wide.s32 	%rd152, %r153, 64;
	add.s64 	%rd153, %rd151, %rd152;
	ld.global.v4.f32 	{%f1089, %f1090, %f1091, %f1092}, [%rd153+16];
	ld.global.u64 	%rd44, [%rd153+48];
	// Keep the current result when %f1089 is non-zero AND %f1384 is <= 0 or NaN
	// (both compares are the unordered forms).
	setp.neu.f32 	%p126, %f1089, 0f00000000;
	setp.leu.f32 	%p127, %f1384, 0f00000000;
	and.pred  	%p128, %p127, %p126;
	@%p128 bra 	$L__BB0_133;

	// Default modulation is (1, 1, 1); used as-is when the handle is null.
	setp.eq.s64 	%p129, %rd44, 0;
	mov.f32 	%f1462, 0f3F800000;
	mov.f32 	%f1463, %f1462;
	mov.f32 	%f1464, %f1462;
	@%p129 bra 	$L__BB0_132;

	// Cube-texture sample with coordinates (-%f1385, -%f1384, -%f1383); the
	// fourth coordinate repeats the third. Result components land in %f1464,
	// %f1463, %f1462 in that order.
	neg.f32 	%f1096, %f1385;
	neg.f32 	%f1097, %f1383;
	neg.f32 	%f1098, %f1384;
	tex.cube.v4.f32.f32 	{%f1464, %f1463, %f1462, %f1099}, [%rd44, {%f1096, %f1098, %f1097, %f1097}];

$L__BB0_132:
	// result = record values (%f1090..%f1092) * modulation, component-wise.
	mul.f32 	%f1465, %f1090, %f1464;
	mul.f32 	%f1466, %f1091, %f1463;
	mul.f32 	%f1467, %f1092, %f1462;

// Writes the result to the first buffer element (%rd43), then blends it with
// the value held in a second buffer whose pointer is stored at params+112.
$L__BB0_133:
	st.global.f32 	[%rd43], %f1465;
	st.global.f32 	[%rd43+4], %f1466;
	st.global.f32 	[%rd43+8], %f1467;
	// %rd45 = base(params+112) + 12 * (stride(params+104) * launch_index_y
	//         + launch_index_x); each element is three f32 values.
	ld.const.u64 	%rd154, [params+112];
	cvta.to.global.u64 	%rd155, %rd154;
	ld.const.u32 	%r686, [params+104];
	mad.lo.s32 	%r687, %r686, %r156, %r155;
	mul.wide.u32 	%rd156, %r687, 12;
	add.s64 	%rd45, %rd155, %rd156;
	// %r688 = flag at params+344; %f1100 = the 32 bits at params+348
	// reinterpreted as f32, used as the blend weight.
	ld.const.v2.u32 	{%r688, %r689}, [params+344];
	mov.b32 	%f1100, %r689;
	// blended = old + (new - old) * weight, per component.
	ld.global.f32 	%f1101, [%rd45];
	sub.f32 	%f1102, %f1465, %f1101;
	ld.global.f32 	%f1103, [%rd45+4];
	sub.f32 	%f1104, %f1466, %f1103;
	ld.global.f32 	%f1105, [%rd45+8];
	sub.f32 	%f1106, %f1467, %f1105;
	fma.rn.f32 	%f325, %f1102, %f1100, %f1101;
	fma.rn.f32 	%f326, %f1104, %f1100, %f1103;
	fma.rn.f32 	%f327, %f1106, %f1100, %f1105;
	// The blended value is written back only when the flag is non-zero; the
	// code that follows uses %f325..%f327 either way.
	setp.eq.s32 	%p130, %r688, 0;
	@%p130 bra 	$L__BB0_135;

	st.global.f32 	[%rd45], %f325;
	st.global.f32 	[%rd45+4], %f326;
	st.global.f32 	[%rd45+8], %f327;

$L__BB0_135:
	not.b32 	%r692, %r156;
	add.s32 	%r154, %r159, %r692;
	ld.const.f32 	%f1108, [params+324];
	mul.f32 	%f328, %f325, %f1108;
	mul.f32 	%f329, %f326, %f1108;
	mul.f32 	%f330, %f327, %f1108;
	mov.f32 	%f1109, 0f3E68BA2E;
	cvt.rzi.f32.f32 	%f1110, %f1109;
	add.f32 	%f1111, %f1110, %f1110;
	mov.f32 	%f1112, 0f3EE8BA2E;
	sub.f32 	%f1113, %f1112, %f1111;
	abs.f32 	%f331, %f1113;
	abs.f32 	%f332, %f328;
	setp.lt.f32 	%p131, %f332, 0f00800000;
	mul.f32 	%f1114, %f332, 0f4B800000;
	selp.f32 	%f1115, %f1114, %f332, %p131;
	selp.f32 	%f1116, 0fC3170000, 0fC2FE0000, %p131;
	mov.b32 	%r693, %f1115;
	and.b32  	%r694, %r693, 8388607;
	or.b32  	%r695, %r694, 1065353216;
	mov.b32 	%f1117, %r695;
	shr.u32 	%r696, %r693, 23;
	cvt.rn.f32.u32 	%f1118, %r696;
	add.f32 	%f1119, %f1116, %f1118;
	setp.gt.f32 	%p132, %f1117, 0f3FB504F3;
	mul.f32 	%f1120, %f1117, 0f3F000000;
	add.f32 	%f1121, %f1119, 0f3F800000;
	selp.f32 	%f1122, %f1121, %f1119, %p132;
	selp.f32 	%f1123, %f1120, %f1117, %p132;
	add.f32 	%f1124, %f1123, 0fBF800000;
	add.f32 	%f1125, %f1123, 0f3F800000;
	rcp.approx.ftz.f32 	%f1126, %f1125;
	add.f32 	%f1127, %f1124, %f1124;
	mul.f32 	%f1128, %f1127, %f1126;
	mul.f32 	%f1129, %f1128, %f1128;
	mov.f32 	%f1130, 0f3C4CAF63;
	mov.f32 	%f1131, 0f3B18F0FE;
	fma.rn.f32 	%f1132, %f1131, %f1129, %f1130;
	mov.f32 	%f1133, 0f3DAAAABD;
	fma.rn.f32 	%f1134, %f1132, %f1129, %f1133;
	mul.rn.f32 	%f1135, %f1134, %f1129;
	mul.rn.f32 	%f1136, %f1135, %f1128;
	sub.f32 	%f1137, %f1124, %f1128;
	add.f32 	%f1138, %f1137, %f1137;
	neg.f32 	%f1139, %f1128;
	fma.rn.f32 	%f1140, %f1139, %f1124, %f1138;
	mul.rn.f32 	%f1141, %f1126, %f1140;
	add.f32 	%f1142, %f1136, %f1128;
	sub.f32 	%f1143, %f1128, %f1142;
	add.f32 	%f1144, %f1136, %f1143;
	add.f32 	%f1145, %f1141, %f1144;
	add.f32 	%f1146, %f1142, %f1145;
	sub.f32 	%f1147, %f1142, %f1146;
	add.f32 	%f1148, %f1145, %f1147;
	mov.f32 	%f1149, 0f3F317200;
	mul.rn.f32 	%f1150, %f1122, %f1149;
	mov.f32 	%f1151, 0f35BFBE8E;
	mul.rn.f32 	%f1152, %f1122, %f1151;
	add.f32 	%f1153, %f1150, %f1146;
	sub.f32 	%f1154, %f1150, %f1153;
	add.f32 	%f1155, %f1146, %f1154;
	add.f32 	%f1156, %f1148, %f1155;
	add.f32 	%f1157, %f1152, %f1156;
	add.f32 	%f1158, %f1153, %f1157;
	sub.f32 	%f1159, %f1153, %f1158;
	add.f32 	%f1160, %f1157, %f1159;
	mul.rn.f32 	%f1161, %f1112, %f1158;
	neg.f32 	%f1162, %f1161;
	fma.rn.f32 	%f1163, %f1112, %f1158, %f1162;
	fma.rn.f32 	%f1164, %f1112, %f1160, %f1163;
	mov.f32 	%f1165, 0f00000000;
	fma.rn.f32 	%f1166, %f1165, %f1158, %f1164;
	add.rn.f32 	%f1167, %f1161, %f1166;
	neg.f32 	%f1168, %f1167;
	add.rn.f32 	%f1169, %f1161, %f1168;
	add.rn.f32 	%f1170, %f1169, %f1166;
	mov.b32 	%r697, %f1167;
	setp.eq.s32 	%p133, %r697, 1118925336;
	add.s32 	%r698, %r697, -1;
	mov.b32 	%f1171, %r698;
	add.f32 	%f1172, %f1170, 0f37000000;
	selp.f32 	%f333, %f1172, %f1170, %p133;
	selp.f32 	%f1173, %f1171, %f1167, %p133;
	mov.f32 	%f1174, 0f3FB8AA3B;
	mul.rn.f32 	%f1175, %f1173, %f1174;
	cvt.rzi.f32.f32 	%f1176, %f1175;
	abs.f32 	%f1177, %f1176;
	setp.gt.f32 	%p134, %f1177, 0f42FC0000;
	mov.b32 	%r699, %f1176;
	and.b32  	%r700, %r699, -2147483648;
	or.b32  	%r701, %r700, 1123811328;
	mov.b32 	%f1178, %r701;
	selp.f32 	%f1179, %f1178, %f1176, %p134;
	mov.f32 	%f1180, 0fBF317218;
	fma.rn.f32 	%f1181, %f1179, %f1180, %f1173;
	mov.f32 	%f1182, 0f3102E308;
	fma.rn.f32 	%f1183, %f1179, %f1182, %f1181;
	mul.f32 	%f1184, %f1183, 0f3FB8AA3B;
	add.f32 	%f1185, %f1179, 0f4B40007F;
	mov.b32 	%r702, %f1185;
	shl.b32 	%r703, %r702, 23;
	mov.b32 	%f1186, %r703;
	ex2.approx.ftz.f32 	%f1187, %f1184;
	mul.f32 	%f334, %f1187, %f1186;
	setp.eq.f32 	%p135, %f334, 0f7F800000;
	mov.f32 	%f1468, 0f7F800000;
	@%p135 bra 	$L__BB0_137;

	fma.rn.f32 	%f1468, %f334, %f333, %f334;

$L__BB0_137:
	setp.lt.f32 	%p136, %f328, 0f00000000;
	setp.eq.f32 	%p137, %f331, 0f3F800000;
	and.pred  	%p2, %p136, %p137;
	setp.eq.f32 	%p138, %f328, 0f00000000;
	@%p138 bra 	$L__BB0_141;
	bra.uni 	$L__BB0_138;

$L__BB0_141:
	add.f32 	%f1192, %f328, %f328;
	selp.f32 	%f1470, %f1192, 0f00000000, %p137;
	bra.uni 	$L__BB0_142;

$L__BB0_138:
	mov.b32 	%r704, %f1468;
	xor.b32  	%r705, %r704, -2147483648;
	mov.b32 	%f1188, %r705;
	selp.f32 	%f1470, %f1188, %f1468, %p2;
	setp.geu.f32 	%p139, %f328, 0f00000000;
	@%p139 bra 	$L__BB0_142;

	mov.f32 	%f1189, 0f3EE8BA2E;
	cvt.rzi.f32.f32 	%f1190, %f1189;
	setp.eq.f32 	%p140, %f1190, 0f3EE8BA2E;
	@%p140 bra 	$L__BB0_142;

	mov.f32 	%f1470, 0f7FFFFFFF;

$L__BB0_142:
	add.f32 	%f1193, %f332, 0f3EE8BA2E;
	mov.b32 	%r706, %f1193;
	setp.lt.s32 	%p142, %r706, 2139095040;
	@%p142 bra 	$L__BB0_147;

	setp.gtu.f32 	%p143, %f332, 0f7F800000;
	@%p143 bra 	$L__BB0_146;
	bra.uni 	$L__BB0_144;

$L__BB0_146:
	add.f32 	%f1470, %f328, 0f3EE8BA2E;
	bra.uni 	$L__BB0_147;

$L__BB0_144:
	setp.neu.f32 	%p144, %f332, 0f7F800000;
	@%p144 bra 	$L__BB0_147;

	selp.f32 	%f1470, 0fFF800000, 0f7F800000, %p2;

$L__BB0_147:
	setp.eq.f32 	%p145, %f328, 0f3F800000;
	selp.f32 	%f1195, 0f3F800000, %f1470, %p145;
	cvt.sat.f32.f32 	%f343, %f1195;
	abs.f32 	%f344, %f329;
	setp.lt.f32 	%p146, %f344, 0f00800000;
	mul.f32 	%f1196, %f344, 0f4B800000;
	selp.f32 	%f1197, %f1196, %f344, %p146;
	selp.f32 	%f1198, 0fC3170000, 0fC2FE0000, %p146;
	mov.b32 	%r707, %f1197;
	and.b32  	%r708, %r707, 8388607;
	or.b32  	%r709, %r708, 1065353216;
	mov.b32 	%f1199, %r709;
	shr.u32 	%r710, %r707, 23;
	cvt.rn.f32.u32 	%f1200, %r710;
	add.f32 	%f1201, %f1198, %f1200;
	setp.gt.f32 	%p147, %f1199, 0f3FB504F3;
	mul.f32 	%f1202, %f1199, 0f3F000000;
	add.f32 	%f1203, %f1201, 0f3F800000;
	selp.f32 	%f1204, %f1203, %f1201, %p147;
	selp.f32 	%f1205, %f1202, %f1199, %p147;
	add.f32 	%f1206, %f1205, 0fBF800000;
	add.f32 	%f1207, %f1205, 0f3F800000;
	rcp.approx.ftz.f32 	%f1208, %f1207;
	add.f32 	%f1209, %f1206, %f1206;
	mul.f32 	%f1210, %f1209, %f1208;
	mul.f32 	%f1211, %f1210, %f1210;
	mov.f32 	%f1212, 0f3C4CAF63;
	mov.f32 	%f1213, 0f3B18F0FE;
	fma.rn.f32 	%f1214, %f1213, %f1211, %f1212;
	mov.f32 	%f1215, 0f3DAAAABD;
	fma.rn.f32 	%f1216, %f1214, %f1211, %f1215;
	mul.rn.f32 	%f1217, %f1216, %f1211;
	mul.rn.f32 	%f1218, %f1217, %f1210;
	sub.f32 	%f1219, %f1206, %f1210;
	add.f32 	%f1220, %f1219, %f1219;
	neg.f32 	%f1221, %f1210;
	fma.rn.f32 	%f1222, %f1221, %f1206, %f1220;
	mul.rn.f32 	%f1223, %f1208, %f1222;
	add.f32 	%f1224, %f1218, %f1210;
	sub.f32 	%f1225, %f1210, %f1224;
	add.f32 	%f1226, %f1218, %f1225;
	add.f32 	%f1227, %f1223, %f1226;
	add.f32 	%f1228, %f1224, %f1227;
	sub.f32 	%f1229, %f1224, %f1228;
	add.f32 	%f1230, %f1227, %f1229;
	mov.f32 	%f1231, 0f3F317200;
	mul.rn.f32 	%f1232, %f1204, %f1231;
	mov.f32 	%f1233, 0f35BFBE8E;
	mul.rn.f32 	%f1234, %f1204, %f1233;
	add.f32 	%f1235, %f1232, %f1228;
	sub.f32 	%f1236, %f1232, %f1235;
	add.f32 	%f1237, %f1228, %f1236;
	add.f32 	%f1238, %f1230, %f1237;
	add.f32 	%f1239, %f1234, %f1238;
	add.f32 	%f1240, %f1235, %f1239;
	sub.f32 	%f1241, %f1235, %f1240;
	add.f32 	%f1242, %f1239, %f1241;
	mov.f32 	%f1243, 0f3EE8BA2E;
	mul.rn.f32 	%f1244, %f1243, %f1240;
	neg.f32 	%f1245, %f1244;
	fma.rn.f32 	%f1246, %f1243, %f1240, %f1245;
	fma.rn.f32 	%f1247, %f1243, %f1242, %f1246;
	mov.f32 	%f1248, 0f00000000;
	fma.rn.f32 	%f1249, %f1248, %f1240, %f1247;
	add.rn.f32 	%f1250, %f1244, %f1249;
	neg.f32 	%f1251, %f1250;
	add.rn.f32 	%f1252, %f1244, %f1251;
	add.rn.f32 	%f1253, %f1252, %f1249;
	mov.b32 	%r711, %f1250;
	setp.eq.s32 	%p148, %r711, 1118925336;
	add.s32 	%r712, %r711, -1;
	mov.b32 	%f1254, %r712;
	add.f32 	%f1255, %f1253, 0f37000000;
	selp.f32 	%f345, %f1255, %f1253, %p148;
	selp.f32 	%f1256, %f1254, %f1250, %p148;
	mov.f32 	%f1257, 0f3FB8AA3B;
	mul.rn.f32 	%f1258, %f1256, %f1257;
	cvt.rzi.f32.f32 	%f1259, %f1258;
	abs.f32 	%f1260, %f1259;
	setp.gt.f32 	%p149, %f1260, 0f42FC0000;
	mov.b32 	%r713, %f1259;
	and.b32  	%r714, %r713, -2147483648;
	or.b32  	%r715, %r714, 1123811328;
	mov.b32 	%f1261, %r715;
	selp.f32 	%f1262, %f1261, %f1259, %p149;
	mov.f32 	%f1263, 0fBF317218;
	fma.rn.f32 	%f1264, %f1262, %f1263, %f1256;
	mov.f32 	%f1265, 0f3102E308;
	fma.rn.f32 	%f1266, %f1262, %f1265, %f1264;
	mul.f32 	%f1267, %f1266, 0f3FB8AA3B;
	add.f32 	%f1268, %f1262, 0f4B40007F;
	mov.b32 	%r716, %f1268;
	shl.b32 	%r717, %r716, 23;
	mov.b32 	%f1269, %r717;
	ex2.approx.ftz.f32 	%f1270, %f1267;
	mul.f32 	%f346, %f1270, %f1269;
	setp.eq.f32 	%p150, %f346, 0f7F800000;
	mov.f32 	%f1471, 0f7F800000;
	@%p150 bra 	$L__BB0_149;

	fma.rn.f32 	%f1471, %f346, %f345, %f346;

$L__BB0_149:
	setp.lt.f32 	%p151, %f329, 0f00000000;
	and.pred  	%p3, %p151, %p137;
	setp.eq.f32 	%p153, %f329, 0f00000000;
	@%p153 bra 	$L__BB0_153;
	bra.uni 	$L__BB0_150;

$L__BB0_153:
	add.f32 	%f1275, %f329, %f329;
	selp.f32 	%f1473, %f1275, 0f00000000, %p137;
	bra.uni 	$L__BB0_154;

$L__BB0_150:
	mov.b32 	%r718, %f1471;
	xor.b32  	%r719, %r718, -2147483648;
	mov.b32 	%f1271, %r719;
	selp.f32 	%f1473, %f1271, %f1471, %p3;
	setp.geu.f32 	%p154, %f329, 0f00000000;
	@%p154 bra 	$L__BB0_154;

	mov.f32 	%f1272, 0f3EE8BA2E;
	cvt.rzi.f32.f32 	%f1273, %f1272;
	setp.eq.f32 	%p155, %f1273, 0f3EE8BA2E;
	@%p155 bra 	$L__BB0_154;

	mov.f32 	%f1473, 0f7FFFFFFF;

$L__BB0_154:
	add.f32 	%f1276, %f344, 0f3EE8BA2E;
	mov.b32 	%r720, %f1276;
	setp.lt.s32 	%p157, %r720, 2139095040;
	@%p157 bra 	$L__BB0_159;

	setp.gtu.f32 	%p158, %f344, 0f7F800000;
	@%p158 bra 	$L__BB0_158;
	bra.uni 	$L__BB0_156;

$L__BB0_158:
	add.f32 	%f1473, %f329, 0f3EE8BA2E;
	bra.uni 	$L__BB0_159;

$L__BB0_156:
	setp.neu.f32 	%p159, %f344, 0f7F800000;
	@%p159 bra 	$L__BB0_159;

	selp.f32 	%f1473, 0fFF800000, 0f7F800000, %p3;

$L__BB0_159:
	setp.eq.f32 	%p160, %f329, 0f3F800000;
	selp.f32 	%f1278, 0f3F800000, %f1473, %p160;
	cvt.sat.f32.f32 	%f355, %f1278;
	abs.f32 	%f356, %f330;
	setp.lt.f32 	%p161, %f356, 0f00800000;
	mul.f32 	%f1279, %f356, 0f4B800000;
	selp.f32 	%f1280, %f1279, %f356, %p161;
	selp.f32 	%f1281, 0fC3170000, 0fC2FE0000, %p161;
	mov.b32 	%r721, %f1280;
	and.b32  	%r722, %r721, 8388607;
	or.b32  	%r723, %r722, 1065353216;
	mov.b32 	%f1282, %r723;
	shr.u32 	%r724, %r721, 23;
	cvt.rn.f32.u32 	%f1283, %r724;
	add.f32 	%f1284, %f1281, %f1283;
	setp.gt.f32 	%p162, %f1282, 0f3FB504F3;
	mul.f32 	%f1285, %f1282, 0f3F000000;
	add.f32 	%f1286, %f1284, 0f3F800000;
	selp.f32 	%f1287, %f1286, %f1284, %p162;
	selp.f32 	%f1288, %f1285, %f1282, %p162;
	add.f32 	%f1289, %f1288, 0fBF800000;
	add.f32 	%f1290, %f1288, 0f3F800000;
	rcp.approx.ftz.f32 	%f1291, %f1290;
	add.f32 	%f1292, %f1289, %f1289;
	mul.f32 	%f1293, %f1292, %f1291;
	mul.f32 	%f1294, %f1293, %f1293;
	mov.f32 	%f1295, 0f3C4CAF63;
	mov.f32 	%f1296, 0f3B18F0FE;
	fma.rn.f32 	%f1297, %f1296, %f1294, %f1295;
	mov.f32 	%f1298, 0f3DAAAABD;
	fma.rn.f32 	%f1299, %f1297, %f1294, %f1298;
	mul.rn.f32 	%f1300, %f1299, %f1294;
	mul.rn.f32 	%f1301, %f1300, %f1293;
	sub.f32 	%f1302, %f1289, %f1293;
	add.f32 	%f1303, %f1302, %f1302;
	neg.f32 	%f1304, %f1293;
	fma.rn.f32 	%f1305, %f1304, %f1289, %f1303;
	mul.rn.f32 	%f1306, %f1291, %f1305;
	add.f32 	%f1307, %f1301, %f1293;
	sub.f32 	%f1308, %f1293, %f1307;
	add.f32 	%f1309, %f1301, %f1308;
	add.f32 	%f1310, %f1306, %f1309;
	add.f32 	%f1311, %f1307, %f1310;
	sub.f32 	%f1312, %f1307, %f1311;
	add.f32 	%f1313, %f1310, %f1312;
	mov.f32 	%f1314, 0f3F317200;
	mul.rn.f32 	%f1315, %f1287, %f1314;
	mov.f32 	%f1316, 0f35BFBE8E;
	mul.rn.f32 	%f1317, %f1287, %f1316;
	add.f32 	%f1318, %f1315, %f1311;
	sub.f32 	%f1319, %f1315, %f1318;
	add.f32 	%f1320, %f1311, %f1319;
	add.f32 	%f1321, %f1313, %f1320;
	add.f32 	%f1322, %f1317, %f1321;
	add.f32 	%f1323, %f1318, %f1322;
	sub.f32 	%f1324, %f1318, %f1323;
	add.f32 	%f1325, %f1322, %f1324;
	mov.f32 	%f1326, 0f3EE8BA2E;
	mul.rn.f32 	%f1327, %f1326, %f1323;
	neg.f32 	%f1328, %f1327;
	fma.rn.f32 	%f1329, %f1326, %f1323, %f1328;
	fma.rn.f32 	%f1330, %f1326, %f1325, %f1329;
	mov.f32 	%f1331, 0f00000000;
	fma.rn.f32 	%f1332, %f1331, %f1323, %f1330;
	add.rn.f32 	%f1333, %f1327, %f1332;
	neg.f32 	%f1334, %f1333;
	add.rn.f32 	%f1335, %f1327, %f1334;
	add.rn.f32 	%f1336, %f1335, %f1332;
	mov.b32 	%r725, %f1333;
	setp.eq.s32 	%p163, %r725, 1118925336;
	add.s32 	%r726, %r725, -1;
	mov.b32 	%f1337, %r726;
	add.f32 	%f1338, %f1336, 0f37000000;
	selp.f32 	%f357, %f1338, %f1336, %p163;
	selp.f32 	%f1339, %f1337, %f1333, %p163;
	mov.f32 	%f1340, 0f3FB8AA3B;
	mul.rn.f32 	%f1341, %f1339, %f1340;
	cvt.rzi.f32.f32 	%f1342, %f1341;
	abs.f32 	%f1343, %f1342;
	setp.gt.f32 	%p164, %f1343, 0f42FC0000;
	mov.b32 	%r727, %f1342;
	and.b32  	%r728, %r727, -2147483648;
	or.b32  	%r729, %r728, 1123811328;
	mov.b32 	%f1344, %r729;
	selp.f32 	%f1345, %f1344, %f1342, %p164;
	mov.f32 	%f1346, 0fBF317218;
	fma.rn.f32 	%f1347, %f1345, %f1346, %f1339;
	mov.f32 	%f1348, 0f3102E308;
	fma.rn.f32 	%f1349, %f1345, %f1348, %f1347;
	mul.f32 	%f1350, %f1349, 0f3FB8AA3B;
	add.f32 	%f1351, %f1345, 0f4B40007F;
	mov.b32 	%r730, %f1351;
	shl.b32 	%r731, %r730, 23;
	mov.b32 	%f1352, %r731;
	ex2.approx.ftz.f32 	%f1353, %f1350;
	mul.f32 	%f358, %f1353, %f1352;
	setp.eq.f32 	%p165, %f358, 0f7F800000;
	mov.f32 	%f1474, 0f7F800000;
	@%p165 bra 	$L__BB0_161;

	fma.rn.f32 	%f1474, %f358, %f357, %f358;

$L__BB0_161:
	setp.lt.f32 	%p166, %f330, 0f00000000;
	and.pred  	%p4, %p166, %p137;
	setp.eq.f32 	%p168, %f330, 0f00000000;
	@%p168 bra 	$L__BB0_165;
	bra.uni 	$L__BB0_162;

$L__BB0_165:
	add.f32 	%f1358, %f330, %f330;
	selp.f32 	%f1476, %f1358, 0f00000000, %p137;
	bra.uni 	$L__BB0_166;

$L__BB0_162:
	mov.b32 	%r732, %f1474;
	xor.b32  	%r733, %r732, -2147483648;
	mov.b32 	%f1354, %r733;
	selp.f32 	%f1476, %f1354, %f1474, %p4;
	setp.geu.f32 	%p169, %f330, 0f00000000;
	@%p169 bra 	$L__BB0_166;

	mov.f32 	%f1355, 0f3EE8BA2E;
	cvt.rzi.f32.f32 	%f1356, %f1355;
	setp.eq.f32 	%p170, %f1356, 0f3EE8BA2E;
	@%p170 bra 	$L__BB0_166;

	mov.f32 	%f1476, 0f7FFFFFFF;

$L__BB0_166:
	add.f32 	%f1359, %f356, 0f3EE8BA2E;
	mov.b32 	%r734, %f1359;
	setp.lt.s32 	%p172, %r734, 2139095040;
	@%p172 bra 	$L__BB0_171;

	setp.gtu.f32 	%p173, %f356, 0f7F800000;
	@%p173 bra 	$L__BB0_170;
	bra.uni 	$L__BB0_168;

$L__BB0_170:
	add.f32 	%f1476, %f330, 0f3EE8BA2E;
	bra.uni 	$L__BB0_171;

$L__BB0_168:
	setp.neu.f32 	%p174, %f356, 0f7F800000;
	@%p174 bra 	$L__BB0_171;

	selp.f32 	%f1476, 0fFF800000, 0f7F800000, %p4;

$L__BB0_171:
	setp.eq.f32 	%p175, %f330, 0f3F800000;
	selp.f32 	%f1360, 0f3F800000, %f1476, %p175;
	cvt.sat.f32.f32 	%f1361, %f1360;
	ld.const.u64 	%rd157, [params+80];
	cvta.to.global.u64 	%rd158, %rd157;
	ld.const.u32 	%r735, [params+72];
	mad.lo.s32 	%r736, %r735, %r154, %r155;
	mul.f32 	%f1362, %f343, 0f437F0000;
	cvt.rzi.u32.f32 	%r737, %f1362;
	mul.f32 	%f1363, %f355, 0f437F0000;
	cvt.rzi.u32.f32 	%r738, %f1363;
	mul.f32 	%f1364, %f1361, 0f437F0000;
	cvt.rzi.u32.f32 	%r739, %f1364;
	mul.wide.u32 	%rd159, %r736, 4;
	add.s64 	%rd160, %rd158, %rd159;
	cvt.u16.u32 	%rs11, %r739;
	cvt.u16.u32 	%rs12, %r738;
	cvt.u16.u32 	%rs13, %r737;
	mov.u16 	%rs14, 255;
	st.global.v4.u8 	[%rd160], {%rs13, %rs12, %rs11, %rs14};
	ret;

}

